File size: 1,908 Bytes
69915da
 
 
 
 
86744e1
 
d37eca2
9c5fada
d37eca2
69915da
86744e1
d37eca2
a4f5fb4
7d34152
e0a1ddd
69915da
 
d37eca2
 
69915da
 
 
 
 
 
9c5fada
69915da
 
 
 
 
 
 
 
 
 
86744e1
69915da
9c5fada
86744e1
 
69915da
 
d37eca2
 
69915da
d37eca2
 
69915da
 
 
 
 
 
9c5fada
69915da
 
 
 
 
 
 
 
 
 
 
 
9c5fada
69915da
 
d37eca2
69915da
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
# No shared default settings are defined; the value is an explicit null.
default_settings: null
# Per-behavior training configuration. This file defines a single behavior,
# SoccerTwos.
behaviors:
  SoccerTwos:
    # Trainer selected for this behavior.
    trainer_type: poca
    # Optimisation hyperparameters passed to the trainer.
    hyperparameters:
      batch_size: 2048
      # Exactly ten times batch_size (20480 = 10 * 2048).
      buffer_size: 20480
      learning_rate: 0.0002
      beta: 0.01
      epsilon: 0.25
      lambd: 0.95
      num_epoch: 3
      # Schedules: linear for learning_rate and beta, constant for epsilon.
      learning_rate_schedule: linear
      beta_schedule: linear
      epsilon_schedule: constant
    # NOTE(review): presumably counted in training steps -- confirm against
    # the trainer documentation.
    checkpoint_interval: 2000000
    # Network settings for the behavior: 3 layers of 512 hidden units, with
    # normalization off and no memory block configured.
    network_settings:
      normalize: false
      hidden_units: 512
      num_layers: 3
      vis_encode_type: simple
      memory: null
      goal_conditioning_type: hyper
      deterministic: false
    # Only one reward signal (extrinsic) is configured.
    reward_signals:
      extrinsic:
        gamma: 0.97
        strength: 1.0
        # The reward signal has its own network_settings, smaller than the
        # behavior-level ones above (128 units x 2 layers vs 512 x 3).
        network_settings:
          normalize: false
          hidden_units: 128
          num_layers: 2
          vis_encode_type: simple
          memory: null
          goal_conditioning_type: hyper
          deterministic: false
    # No initialisation path is set.
    init_path: null
    keep_checkpoints: 2
    even_checkpoints: false
    # 1.2 billion.
    max_steps: 1200000000
    time_horizon: 1000
    summary_freq: 100000
    threaded: false
    # Self-play settings. save_steps and team_change hold the same value
    # (200000); swap_steps is 100x smaller (2000).
    self_play:
      save_steps: 200000
      team_change: 200000
      swap_steps: 2000
      window: 50
      play_against_latest_model_ratio: 0.5
      initial_elo: 1200.0
    # Behavioral cloning is not configured.
    behavioral_cloning: null
# Settings describing the environment executable and how it is started.
env_settings:
  # Relative path to the SoccerTwos x86_64 executable.
  # NOTE(review): presumably resolved against the working directory of the
  # training process -- confirm.
  env_path: ml-agents/training-envs-executables/SoccerTwos/SoccerTwos.x86_64
  # No extra arguments are passed to the environment.
  env_args: null
  base_port: 5005
  # A single environment instance with a single area.
  num_envs: 1
  num_areas: 1
  # NOTE(review): -1 presumably requests a randomly chosen seed -- confirm.
  seed: -1
  # Restart limits: 10 lifetime restarts; rate limit of 1 per 60 s period
  # (as the key names suggest -- confirm exact semantics).
  max_lifetime_restarts: 10
  restarts_rate_limit_n: 1
  restarts_rate_limit_period_s: 60
# Engine/rendering settings for the environment.
engine_settings:
  # Square 84 x 84 window.
  width: 84
  height: 84
  quality_level: 5
  time_scale: 20
  # NOTE(review): -1 presumably means "no frame-rate cap" -- confirm.
  target_frame_rate: -1
  capture_frame_rate: 60
  # Graphics are left enabled (no_graphics is false).
  no_graphics: false
# No environment parameters are defined; the value is an explicit null.
environment_parameters: null
# Run identification and checkpoint/resume flags.
checkpoint_settings:
  # Quoted so the value stays the string '0046'; unquoted it would be read
  # as a number and the leading zeros would not survive.
  run_id: '0046'
  initialize_from: null
  load_model: false
  # NOTE(review): resume is true while load_model and train_model are both
  # false -- confirm this combination is what the run intended.
  resume: true
  force: false
  train_model: false
  inference: false
  # Relative directory name for results.
  results_dir: results
# Torch settings.
torch_settings:
  # No device is pinned.
  # NOTE(review): presumably the framework then picks a device itself --
  # confirm.
  device: null
# Debug flag is off.
debug: false