!!python/object/apply:collections.OrderedDict | |
- - - batch_size | |
- 32 | |
- - clip_range | |
- 0.3 | |
- - ent_coef | |
- 3.62109e-06 | |
- - gae_lambda | |
- 0.9 | |
- - gamma | |
- 0.99 | |
- - learning_rate | |
- 2.55673e-05 | |
- - max_grad_norm | |
- 0.7 | |
- - n_envs | |
- 1 | |
- - n_epochs | |
- 20 | |
- - n_steps | |
- 512 | |
- - n_timesteps | |
- 10000000.0 | |
- - normalize | |
- true | |
- - policy | |
- MlpPolicy | |
- - policy_kwargs | |
- dict( log_std_init=-2, ortho_init=False, activation_fn=nn.ReLU, net_arch=dict(pi=[256, | |
256], vf=[256, 256]) ) | |
- - vf_coef | |
- 0.430793 | |