# Hyperparameter set serialized as a Python collections.OrderedDict.
# The document is a single constructor call: the tag below names the callable,
# and the one top-level sequence item is its sole positional argument -- a list
# of two-element [key, value] lists, in insertion order.
#
# SECURITY: the `!!python/object/apply` tag invokes a Python callable at load
# time. `yaml.safe_load` rejects it; loading requires PyYAML's unsafe loader
# (`yaml.unsafe_load` / `Loader=yaml.UnsafeLoader`). Only load this file from a
# trusted source.
!!python/object/apply:collections.OrderedDict
- - - batch_size
    - 256
  - - clip_range
    - 0.4
  - - ent_coef
    - 1.6077823351479547e-08
  # Value is a one-element list holding a dotted import path.
  - - env_wrapper
    - - stable_baselines3.common.atari_wrappers.AtariWrapper
  - - frame_stack
    - 4
  - - gae_lambda
    - 0.9342974216877361
  - - gamma
    - 0.999
  - - learning_rate
    - 0.009929843682975054
  - - n_envs
    - 8
  - - n_epochs
    - 9
  - - n_steps
    - 128
  # Stored as a float (5000000.0), not an int.
  - - n_timesteps
    - 5000000.0
  - - normalize
    - false
  - - policy
    - CnnPolicy
  # Stored as a plain string containing a Python expression, not as a YAML
  # mapping. NOTE(review): presumably the consumer eval()s this with `nn`
  # (torch.nn) in scope -- confirm against the loader before trusting this file.
  # NOTE(review): the list-wrapped `net_arch=[dict(pi=..., vf=...)]` form is
  # believed to be deprecated in newer Stable-Baselines3 releases in favour of
  # `net_arch=dict(pi=..., vf=...)` -- verify against the pinned SB3 version.
  - - policy_kwargs
    - dict(net_arch=[dict(pi=[64, 64], vf=[64, 64]),],activation_fn=nn.Tanh)
  - - vf_coef
    - 0.7945615838365445