TheoVincent committed on
Commit
ab7c3b9
·
1 Parent(s): 1da1c7d

refine config.json

Browse files
Files changed (1) hide show
  1. config.json +6 -5
config.json CHANGED
@@ -11,19 +11,20 @@
11
  "ending_eps": 0.01,
12
  "duration_eps": 250000,
13
  "batch_size": 32,
14
- "n_step_return": 5,
15
  "---- i-DQN ---": "----------------------------",
16
  "idqn_learning_rate": 6.25e-5,
17
  "idqn_optimizer_eps": 1.5e-4,
18
- "idqn_n_training_steps_per_target_update": 3000000,
19
- "idqn_n_training_steps_per_rolling_step": 8000,
 
20
  "idqn_head_behaviorial_policy": "uniform",
21
  "idqn_shared_network": true,
22
  "---- i-IQN ---": "----------------------------",
23
  "iiqn_learning_rate": 0.00005,
24
  "iiqn_optimizer_eps": 0.0003125,
25
- "iiqn_n_training_steps_per_target_update": 3000000,
26
- "iiqn_n_training_steps_per_rolling_step": 8000,
 
27
  "iiqn_head_behaviorial_policy": "uniform",
28
  "iiqn_n_quantiles_policy": 32,
29
  "iiqn_n_quantiles": 64,
 
11
  "ending_eps": 0.01,
12
  "duration_eps": 250000,
13
  "batch_size": 32,
 
14
  "---- i-DQN ---": "----------------------------",
15
  "idqn_learning_rate": 6.25e-5,
16
  "idqn_optimizer_eps": 1.5e-4,
17
+ "idqn_n_step_return": 1,
18
+ "idqn_n_training_steps_per_target_update": 30,
19
+ "idqn_n_training_steps_per_window_shift": 6000,
20
  "idqn_head_behaviorial_policy": "uniform",
21
  "idqn_shared_network": true,
22
  "---- i-IQN ---": "----------------------------",
23
  "iiqn_learning_rate": 0.00005,
24
  "iiqn_optimizer_eps": 0.0003125,
25
+ "iiqn_n_step_return": 3,
26
+ "iiqn_n_training_steps_per_target_update": 30,
27
+ "iiqn_n_training_steps_per_window_shift": 6000,
28
  "iiqn_head_behaviorial_policy": "uniform",
29
  "iiqn_n_quantiles_policy": 32,
30
  "iiqn_n_quantiles": 64,