# Serialized hyperparameter set, stored as a Python OrderedDict.
#
# Layout: the tag below calls collections.OrderedDict with one positional
# argument, a sequence of [name, value] pairs, so key order is preserved.
#
# NOTE(security): `!!python/object/apply` is a Python-specific tag. It is
# rejected by `yaml.safe_load` and can only be constructed by a loader that
# permits arbitrary Python object construction. Load this file only from a
# trusted source.
#
# NOTE(review): the keys (clip_range, ent_coef, gae_lambda, vf_coef, n_epochs)
# look like PPO-style settings, and `policy_kwargs` is a string holding a
# Python expression that the consumer presumably evaluates with `nn` in
# scope -- confirm against the code that reads this file.
!!python/object/apply:collections.OrderedDict
- - - batch_size
    - 256
  - - clip_range
    - 0.4
  - - ent_coef
    - 1.6077823351479547e-08
  - - env_wrapper
    # Value is a one-element list of dotted wrapper class paths.
    - - stable_baselines3.common.atari_wrappers.AtariWrapper
  - - frame_stack
    - 4
  - - gae_lambda
    - 0.9342974216877361
  - - gamma
    - 0.999
  - - learning_rate
    - 0.009929843682975054
  - - n_envs
    - 8
  - - n_epochs
    - 9
  - - n_steps
    - 128
  - - n_timesteps
    # Stored as a float (5e6); kept as-is to match the original value.
    - 5000000.0
  - - normalize
    - false
  - - policy
    - CnnPolicy
  - - policy_kwargs
    # Plain string, not a mapping; contents are reproduced byte-for-byte.
    - dict(net_arch=[dict(pi=[64, 64], vf=[64, 64]),],activation_fn=nn.Tanh)
  - - vf_coef
    - 0.7945615838365445