File size: 1,908 Bytes
69915da 86744e1 d37eca2 9c5fada d37eca2 69915da 86744e1 d37eca2 a4f5fb4 7d34152 e0a1ddd 69915da d37eca2 69915da 9c5fada 69915da 86744e1 69915da 9c5fada 86744e1 69915da d37eca2 69915da d37eca2 69915da 9c5fada 69915da 9c5fada 69915da d37eca2 69915da |
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72 73 74 75 76 77 78 79 80 81 82 83 |
# No default settings are supplied in this file (explicit null).
# NOTE(review): presumably a place for defaults shared by all behaviors —
# confirm against the consumer's schema.
default_settings: null
# Trainer configuration keyed by behavior name; a single behavior,
# SoccerTwos, is defined here.
# NOTE(review): the source had lost all indentation, so nested keys such as
# network_settings / normalize / hidden_units / num_layers appeared twice at
# the same level (duplicate keys, last value silently wins). The nesting
# below is reconstructed following the ML-Agents trainer-config layout —
# confirm against the original run output.
behaviors:
  SoccerTwos:
    trainer_type: poca
    hyperparameters:
      batch_size: 2048
      # buffer_size is 10x batch_size.
      buffer_size: 20480
      learning_rate: 0.0002
      beta: 0.01
      epsilon: 0.25
      lambd: 0.95
      num_epoch: 3
      # learning_rate and beta use a linear schedule; epsilon is constant.
      learning_rate_schedule: linear
      beta_schedule: linear
      epsilon_schedule: constant
    checkpoint_interval: 2000000
    # Behavior-level network: 3 layers of 512 hidden units.
    network_settings:
      normalize: false
      hidden_units: 512
      num_layers: 3
      vis_encode_type: simple
      memory: null
      goal_conditioning_type: hyper
      deterministic: false
    reward_signals:
      extrinsic:
        gamma: 0.97
        strength: 1.0
        # Separate network_settings for the extrinsic reward signal
        # (2 layers of 128 hidden units). It must stay nested here so it
        # does not collide with the behavior-level network_settings above.
        network_settings:
          normalize: false
          hidden_units: 128
          num_layers: 2
          vis_encode_type: simple
          memory: null
          goal_conditioning_type: hyper
          deterministic: false
    init_path: null
    keep_checkpoints: 2
    even_checkpoints: false
    max_steps: 1200000000
    time_horizon: 1000
    summary_freq: 100000
    threaded: false
    self_play:
      save_steps: 200000
      team_change: 200000
      swap_steps: 2000
      window: 50
      play_against_latest_model_ratio: 0.5
      initial_elo: 1200.0
    behavioral_cloning: null
# Settings for the environment executable and its worker processes.
# NOTE(review): indentation was lost in the source, which left env_settings
# itself null and its children as top-level keys; nesting restored here —
# confirm against the original file.
env_settings:
  env_path: ml-agents/training-envs-executables/SoccerTwos/SoccerTwos.x86_64
  env_args: null
  base_port: 5005
  num_envs: 1
  num_areas: 1
  # NOTE(review): -1 presumably requests a randomly chosen seed — verify.
  seed: -1
  max_lifetime_restarts: 10
  restarts_rate_limit_n: 1
  restarts_rate_limit_period_s: 60
# Engine settings: an 84x84 window, quality level 5, time scale 20.
# NOTE(review): indentation was lost in the source, which left
# engine_settings itself null and its children as top-level keys; nesting
# restored here — confirm against the original file.
engine_settings:
  width: 84
  height: 84
  quality_level: 5
  time_scale: 20
  # NOTE(review): -1 presumably means "no explicit frame-rate target" —
  # verify against the engine documentation.
  target_frame_rate: -1
  capture_frame_rate: 60
  no_graphics: false
# No environment parameters are set for this run (explicit null).
environment_parameters: null
# Run identity and checkpoint/resume flags.
# NOTE(review): indentation was lost in the source, which left
# checkpoint_settings itself null and its children as top-level keys;
# nesting restored here — confirm against the original file.
checkpoint_settings:
  # Quoted so the value stays the string '0046'; unquoted it would be read
  # as a number and lose its leading zeros.
  run_id: '0046'
  initialize_from: null
  load_model: false
  # Only resume is enabled; load_model, force, train_model and inference
  # are all false.
  resume: true
  force: false
  train_model: false
  inference: false
  results_dir: results
# Torch settings.
# NOTE(review): indentation was lost in the source, which left
# torch_settings itself null and device as a top-level key; nesting
# restored here — confirm against the original file.
torch_settings:
  # No device is pinned (null).
  # NOTE(review): presumably the trainer then selects one itself — verify.
  device: null
# Debug flag is off for this run.
debug: false
|