{"mean_reward": 19340.0, "std_reward": 862.7137416316028, "is_deterministic": false, "n_eval_episodes": 10, "eval_datetime": "2022-06-27T01:06:57.012393"} |
{"mean_reward": 19340.0, "std_reward": 862.7137416316028, "is_deterministic": false, "n_eval_episodes": 10, "eval_datetime": "2022-06-27T01:06:57.012393"} |