tqc-PandaReach-v3 / config.yml
Chenchen Liu
Initial commit
cedf395
raw
history blame contribute delete
517 Bytes
!!python/object/apply:collections.OrderedDict
- - - batch_size
- 256
- - buffer_size
- 1000000
- - ent_coef
- auto
- - gamma
- 0.95
- - learning_rate
- 0.001
- - learning_starts
- 1000
- - n_timesteps
- 20000.0
- - normalize
- true
- - policy
- MultiInputPolicy
- - policy_kwargs
- dict(net_arch=[64, 64], n_critics=1)
- - replay_buffer_class
- HerReplayBuffer
- - replay_buffer_kwargs
- dict( goal_selection_strategy='future', n_sampled_goal=4 )