p3nGu1nZz committed on
Commit
fba91ab
·
1 Parent(s): f048d67

Added the latest PPO runs A1, A2, and A3, which used 500, 2500, and 4800 training messages, respectively. No other settings or configuration were modified.

Browse files
This view is limited to 50 files because it contains too many changes.   See raw diff
Files changed (50) hide show
  1. results/tau_agent_ppo_A1_2M/Tau-A1-PPO-1M.onnx +3 -0
  2. results/tau_agent_ppo_A1_2M/TauAgent/TauAgent-1199744.onnx +3 -0
  3. results/tau_agent_ppo_A1_2M/TauAgent/TauAgent-1199744.pt +3 -0
  4. results/tau_agent_ppo_A1_2M/TauAgent/TauAgent-1299958.onnx +3 -0
  5. results/tau_agent_ppo_A1_2M/TauAgent/TauAgent-1299958.pt +3 -0
  6. results/tau_agent_ppo_A1_2M/TauAgent/TauAgent-1399744.onnx +3 -0
  7. results/tau_agent_ppo_A1_2M/TauAgent/TauAgent-1399744.pt +3 -0
  8. results/tau_agent_ppo_A1_2M/TauAgent/TauAgent-1499776.onnx +3 -0
  9. results/tau_agent_ppo_A1_2M/TauAgent/TauAgent-1499776.pt +3 -0
  10. results/tau_agent_ppo_A1_2M/TauAgent/TauAgent-1599808.onnx +3 -0
  11. results/tau_agent_ppo_A1_2M/TauAgent/TauAgent-1599808.pt +3 -0
  12. results/tau_agent_ppo_A1_2M/TauAgent/TauAgent-1699840.onnx +3 -0
  13. results/tau_agent_ppo_A1_2M/TauAgent/TauAgent-1699840.pt +3 -0
  14. results/tau_agent_ppo_A1_2M/TauAgent/TauAgent-1799808.onnx +3 -0
  15. results/tau_agent_ppo_A1_2M/TauAgent/TauAgent-1799808.pt +3 -0
  16. results/tau_agent_ppo_A1_2M/TauAgent/TauAgent-1899840.onnx +3 -0
  17. results/tau_agent_ppo_A1_2M/TauAgent/TauAgent-1899840.pt +3 -0
  18. results/tau_agent_ppo_A1_2M/TauAgent/TauAgent-1999872.onnx +3 -0
  19. results/tau_agent_ppo_A1_2M/TauAgent/TauAgent-1999872.pt +3 -0
  20. results/tau_agent_ppo_A1_2M/TauAgent/TauAgent-2005504.onnx +3 -0
  21. results/tau_agent_ppo_A1_2M/TauAgent/TauAgent-2005504.pt +3 -0
  22. results/tau_agent_ppo_A1_2M/TauAgent/checkpoint.pt +3 -0
  23. results/tau_agent_ppo_A1_2M/configuration.yaml +93 -0
  24. results/tau_agent_ppo_A2_2M/Tau-A2-PPO-1M.onnx +3 -0
  25. results/tau_agent_ppo_A2_2M/TauAgent/TauAgent-1199868.onnx +3 -0
  26. results/tau_agent_ppo_A2_2M/TauAgent/TauAgent-1199868.pt +3 -0
  27. results/tau_agent_ppo_A2_2M/TauAgent/TauAgent-1299820.onnx +3 -0
  28. results/tau_agent_ppo_A2_2M/TauAgent/TauAgent-1299820.pt +3 -0
  29. results/tau_agent_ppo_A2_2M/TauAgent/TauAgent-1399844.onnx +3 -0
  30. results/tau_agent_ppo_A2_2M/TauAgent/TauAgent-1399844.pt +3 -0
  31. results/tau_agent_ppo_A2_2M/TauAgent/TauAgent-1499868.onnx +3 -0
  32. results/tau_agent_ppo_A2_2M/TauAgent/TauAgent-1499868.pt +3 -0
  33. results/tau_agent_ppo_A2_2M/TauAgent/TauAgent-1599820.onnx +3 -0
  34. results/tau_agent_ppo_A2_2M/TauAgent/TauAgent-1599820.pt +3 -0
  35. results/tau_agent_ppo_A2_2M/TauAgent/TauAgent-1699844.onnx +3 -0
  36. results/tau_agent_ppo_A2_2M/TauAgent/TauAgent-1699844.pt +3 -0
  37. results/tau_agent_ppo_A2_2M/TauAgent/TauAgent-1799868.onnx +3 -0
  38. results/tau_agent_ppo_A2_2M/TauAgent/TauAgent-1799868.pt +3 -0
  39. results/tau_agent_ppo_A2_2M/TauAgent/TauAgent-1899820.onnx +3 -0
  40. results/tau_agent_ppo_A2_2M/TauAgent/TauAgent-1899820.pt +3 -0
  41. results/tau_agent_ppo_A2_2M/TauAgent/TauAgent-1999844.onnx +3 -0
  42. results/tau_agent_ppo_A2_2M/TauAgent/TauAgent-1999844.pt +3 -0
  43. results/tau_agent_ppo_A2_2M/TauAgent/TauAgent-2001380.onnx +3 -0
  44. results/tau_agent_ppo_A2_2M/TauAgent/TauAgent-2001380.pt +3 -0
  45. results/tau_agent_ppo_A2_2M/TauAgent/TauAgent-2691.onnx +3 -0
  46. results/tau_agent_ppo_A2_2M/TauAgent/TauAgent-2691.pt +3 -0
  47. results/tau_agent_ppo_A2_2M/TauAgent/checkpoint.pt +3 -0
  48. results/tau_agent_ppo_A2_2M/configuration.yaml +93 -0
  49. results/tau_agent_ppo_A3_2M/Tau-A3-PPO-1M.onnx +3 -0
  50. results/tau_agent_ppo_A3_2M/TauAgent/TauAgent-1199856.onnx +3 -0
results/tau_agent_ppo_A1_2M/Tau-A1-PPO-1M.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:08931e19cffa93c14fed86e9bb88278424715303928d4761bf3dcc257fdde73d
3
+ size 2186395
results/tau_agent_ppo_A1_2M/TauAgent/TauAgent-1199744.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b24d7a70f3f708362ccd3b35ccbf309d81696c379a5c2111810676ffda6c9c3d
3
+ size 2186395
results/tau_agent_ppo_A1_2M/TauAgent/TauAgent-1199744.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4f556a11f0fea58e2cc679cf2f9ad6e86403425ced6496f25188080f8f29bc8e
3
+ size 15534256
results/tau_agent_ppo_A1_2M/TauAgent/TauAgent-1299958.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bb6f5d1ee696b00963d7cb00a10b924fdf123f5eb46b618ba006117c7d843919
3
+ size 2186395
results/tau_agent_ppo_A1_2M/TauAgent/TauAgent-1299958.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0c0244046f46126c14c82f60ef46b799325fb0f35205cec04ccec9141784a93c
3
+ size 15534256
results/tau_agent_ppo_A1_2M/TauAgent/TauAgent-1399744.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9d0b419212303e89f05b6d735d04bb392166df4dd491fd0036ea2fce40a3abd6
3
+ size 2186395
results/tau_agent_ppo_A1_2M/TauAgent/TauAgent-1399744.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c120a1fa8108b6b9558d9667fe949808b3e16394d499693e20392d2ea1f6c28e
3
+ size 15534256
results/tau_agent_ppo_A1_2M/TauAgent/TauAgent-1499776.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f424ea2d9e633119050d04d95e1079bee5e8c3a1a9fee31282ca95855bd7d885
3
+ size 2186395
results/tau_agent_ppo_A1_2M/TauAgent/TauAgent-1499776.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:912696d11a6837fc71783e311bed38195e1dda57fe4123a64141db5e96083ba3
3
+ size 15534256
results/tau_agent_ppo_A1_2M/TauAgent/TauAgent-1599808.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:56f777fafa9cc0919950a0231834f75954a17c4e07b9bcf7c6b2b3dbc5426c41
3
+ size 2186395
results/tau_agent_ppo_A1_2M/TauAgent/TauAgent-1599808.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f311e89bfe1d1fa8a578efe91d9ceafece8fa50a349a0721013634ff0e664ef9
3
+ size 15534256
results/tau_agent_ppo_A1_2M/TauAgent/TauAgent-1699840.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:90533537979d9abeb815e499a777474c4c0c66e3068c3e9de39c17512f6cd35c
3
+ size 2186395
results/tau_agent_ppo_A1_2M/TauAgent/TauAgent-1699840.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:09f5ead3bb039e49e211a2ca8d7afa788223c1ed2b9883342efc46ef66799982
3
+ size 15534256
results/tau_agent_ppo_A1_2M/TauAgent/TauAgent-1799808.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:de1ea3ba5c8d90ce7be467ee2871441c2dbb220e8761d14b8c3d70439bc9ad7b
3
+ size 2186395
results/tau_agent_ppo_A1_2M/TauAgent/TauAgent-1799808.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:32def0f45b71e638ddd1ad302b620df2526e4099b0bc65c9f4b1ec7a2737b092
3
+ size 15534256
results/tau_agent_ppo_A1_2M/TauAgent/TauAgent-1899840.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9677e46c8e368b0e5f5a3aa982ca3949bf1f4489fa58ae55cea8801e56563aba
3
+ size 2186395
results/tau_agent_ppo_A1_2M/TauAgent/TauAgent-1899840.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a9cacd7cdf76e019c35c7618a719b7c58d5b468f7a47d136dc4d1dcea7ede6b7
3
+ size 15534256
results/tau_agent_ppo_A1_2M/TauAgent/TauAgent-1999872.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5eb6959372271405f646cec449cddcc6d19f604a7d02b5422b02aa7035aa9906
3
+ size 2186395
results/tau_agent_ppo_A1_2M/TauAgent/TauAgent-1999872.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:cfc7b6a20afe2601acf9523584f01e56a6a62f274dff5066b5b53ae4621953aa
3
+ size 15534256
results/tau_agent_ppo_A1_2M/TauAgent/TauAgent-2005504.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:08931e19cffa93c14fed86e9bb88278424715303928d4761bf3dcc257fdde73d
3
+ size 2186395
results/tau_agent_ppo_A1_2M/TauAgent/TauAgent-2005504.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:260196c3491aca9156c57f3d29bba9cb40b9655acd53407f09075f191df035ae
3
+ size 15534256
results/tau_agent_ppo_A1_2M/TauAgent/checkpoint.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:37080da1574efbcf39b5938261f36738c44437f2ceb72501058d86a7ffe8d386
3
+ size 15533332
results/tau_agent_ppo_A1_2M/configuration.yaml ADDED
@@ -0,0 +1,93 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ default_settings: null
2
+ behaviors:
3
+ TauAgent:
4
+ trainer_type: ppo
5
+ hyperparameters:
6
+ batch_size: 256
7
+ buffer_size: 4096
8
+ learning_rate: 3.0e-05
9
+ beta: 0.005
10
+ epsilon: 0.2
11
+ lambd: 0.95
12
+ num_epoch: 7
13
+ shared_critic: false
14
+ learning_rate_schedule: linear
15
+ beta_schedule: linear
16
+ epsilon_schedule: linear
17
+ checkpoint_interval: 100000
18
+ network_settings:
19
+ normalize: true
20
+ hidden_units: 256
21
+ num_layers: 4
22
+ vis_encode_type: simple
23
+ memory:
24
+ sequence_length: 256
25
+ memory_size: 256
26
+ goal_conditioning_type: hyper
27
+ deterministic: false
28
+ reward_signals:
29
+ extrinsic:
30
+ gamma: 0.99
31
+ strength: 1.0
32
+ network_settings:
33
+ normalize: false
34
+ hidden_units: 128
35
+ num_layers: 2
36
+ vis_encode_type: simple
37
+ memory: null
38
+ goal_conditioning_type: hyper
39
+ deterministic: false
40
+ curiosity:
41
+ gamma: 0.995
42
+ strength: 0.1
43
+ network_settings:
44
+ normalize: true
45
+ hidden_units: 256
46
+ num_layers: 4
47
+ vis_encode_type: simple
48
+ memory: null
49
+ goal_conditioning_type: hyper
50
+ deterministic: false
51
+ learning_rate: 0.0003
52
+ encoding_size: null
53
+ init_path: null
54
+ keep_checkpoints: 10
55
+ even_checkpoints: false
56
+ max_steps: 2000000
57
+ time_horizon: 256
58
+ summary_freq: 10000
59
+ threaded: true
60
+ self_play: null
61
+ behavioral_cloning: null
62
+ env_settings:
63
+ env_path: .\Build
64
+ env_args: null
65
+ base_port: 5005
66
+ num_envs: 1
67
+ num_areas: 1
68
+ timeout_wait: 300
69
+ seed: -1
70
+ max_lifetime_restarts: 10
71
+ restarts_rate_limit_n: 1
72
+ restarts_rate_limit_period_s: 60
73
+ engine_settings:
74
+ width: 84
75
+ height: 84
76
+ quality_level: 5
77
+ time_scale: 20
78
+ target_frame_rate: -1
79
+ capture_frame_rate: 60
80
+ no_graphics: false
81
+ environment_parameters: null
82
+ checkpoint_settings:
83
+ run_id: tau_agent_ppo_A1
84
+ initialize_from: null
85
+ load_model: false
86
+ resume: false
87
+ force: true
88
+ train_model: false
89
+ inference: false
90
+ results_dir: results
91
+ torch_settings:
92
+ device: cuda
93
+ debug: false
results/tau_agent_ppo_A2_2M/Tau-A2-PPO-1M.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d0398c964e34982251733242637984c7f01c824d098f526c1be6faebd4210d87
3
+ size 2186395
results/tau_agent_ppo_A2_2M/TauAgent/TauAgent-1199868.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:135d63df9d0d0b736354fe26cf96eb27fd528a6b78cfdd9261e9d37eaa07645a
3
+ size 2186395
results/tau_agent_ppo_A2_2M/TauAgent/TauAgent-1199868.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6c267a9eff45dba057281c3d9a1425e46bdecdff480356e90b9a354b73267d4c
3
+ size 15534256
results/tau_agent_ppo_A2_2M/TauAgent/TauAgent-1299820.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:eb3f9db35c9e2a17516579b7d7a10cfabca5f8ce8fc35f610f6e31e5c31116d6
3
+ size 2186395
results/tau_agent_ppo_A2_2M/TauAgent/TauAgent-1299820.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a27f22154179dd27cc60dcbfa1bb369e610739ff25e5325a6da7cc47927dd772
3
+ size 15534256
results/tau_agent_ppo_A2_2M/TauAgent/TauAgent-1399844.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4b6fa40c7cf1be40ae83a0da94b1c67a3392dc6d7c3d10ba0ee824563040f498
3
+ size 2186395
results/tau_agent_ppo_A2_2M/TauAgent/TauAgent-1399844.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ef4ded635e0f2d7a408f2b0ba43dcd353527645b494b8339717c0c6beb023e9e
3
+ size 15534256
results/tau_agent_ppo_A2_2M/TauAgent/TauAgent-1499868.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bde1956a288922cd17553dfb3027b65840d6766d70e1558e55116dc4b7e0b148
3
+ size 2186395
results/tau_agent_ppo_A2_2M/TauAgent/TauAgent-1499868.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:43fd0bcbe8f220bdf21da53f0f40477cfdf85dcedd5d8722f1a901da6d5fe185
3
+ size 15534256
results/tau_agent_ppo_A2_2M/TauAgent/TauAgent-1599820.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9ee9e2c05daba2b0b5254c288c3706cb814ced4c31f1e088fabeda28094eee28
3
+ size 2186395
results/tau_agent_ppo_A2_2M/TauAgent/TauAgent-1599820.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:59f02f3bb74ce6e76abd70f9be17c895ed9e87262a9fdf3fbf981dd81966da3d
3
+ size 15534256
results/tau_agent_ppo_A2_2M/TauAgent/TauAgent-1699844.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b254dcda11ad3360337459541fbe1eb03658c8424f83cb672ad4a11f42b512a5
3
+ size 2186395
results/tau_agent_ppo_A2_2M/TauAgent/TauAgent-1699844.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ef765287b85642373bb594a04833b1180ceb9bcc66442aba2f59192f9e7982e3
3
+ size 15534256
results/tau_agent_ppo_A2_2M/TauAgent/TauAgent-1799868.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:28a0be07927cd17bbd3f5417c7b84a0cc7c4c3dd4e09336ba95f5dfda77c271f
3
+ size 2186395
results/tau_agent_ppo_A2_2M/TauAgent/TauAgent-1799868.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f21e737f0a400fce4dce9099c6991ff915b47c002776aa5ab2f63c382969a4e8
3
+ size 15534256
results/tau_agent_ppo_A2_2M/TauAgent/TauAgent-1899820.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ebef6bb98b397cc3a0db618129077e2eb0c5040b350017cbdfbe41fa4df5a6de
3
+ size 2186395
results/tau_agent_ppo_A2_2M/TauAgent/TauAgent-1899820.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7e04a0c1478dfcfcfe86eba2a77040340db266c8436cb89bd95132882ce71455
3
+ size 15534256
results/tau_agent_ppo_A2_2M/TauAgent/TauAgent-1999844.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9cdd31e9ab7c20921ac634bda0d154b8d0e9071e7b6c1291574057ff756f79ad
3
+ size 2186395
results/tau_agent_ppo_A2_2M/TauAgent/TauAgent-1999844.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0f6dc7e8db3a95f24d80f52fc0d66d4f04b9eb7ce550f9fa9f5acba467eedc02
3
+ size 15534256
results/tau_agent_ppo_A2_2M/TauAgent/TauAgent-2001380.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d0398c964e34982251733242637984c7f01c824d098f526c1be6faebd4210d87
3
+ size 2186395
results/tau_agent_ppo_A2_2M/TauAgent/TauAgent-2001380.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2f02d4d44874d0d318cc7234de23203bc8c69afd8e8c79835e02f7901c5f3eea
3
+ size 15534256
results/tau_agent_ppo_A2_2M/TauAgent/TauAgent-2691.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2ef1367f89737191e33e79e4b9dca4bf87dcfe0ca8d867b3680469fd7f204799
3
+ size 2186395
results/tau_agent_ppo_A2_2M/TauAgent/TauAgent-2691.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:965410fd6c5f389dab95a0384ab8bac2123d68b30ec893866d6d579980c9ee37
3
+ size 15533794
results/tau_agent_ppo_A2_2M/TauAgent/checkpoint.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:55deb589e17065ca91cc72c3f4cac41e7ed505b3f1f1e6761063687bdfbbb9df
3
+ size 15533332
results/tau_agent_ppo_A2_2M/configuration.yaml ADDED
@@ -0,0 +1,93 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ default_settings: null
2
+ behaviors:
3
+ TauAgent:
4
+ trainer_type: ppo
5
+ hyperparameters:
6
+ batch_size: 256
7
+ buffer_size: 4096
8
+ learning_rate: 3.0e-05
9
+ beta: 0.005
10
+ epsilon: 0.2
11
+ lambd: 0.95
12
+ num_epoch: 7
13
+ shared_critic: false
14
+ learning_rate_schedule: linear
15
+ beta_schedule: linear
16
+ epsilon_schedule: linear
17
+ checkpoint_interval: 100000
18
+ network_settings:
19
+ normalize: true
20
+ hidden_units: 256
21
+ num_layers: 4
22
+ vis_encode_type: simple
23
+ memory:
24
+ sequence_length: 256
25
+ memory_size: 256
26
+ goal_conditioning_type: hyper
27
+ deterministic: false
28
+ reward_signals:
29
+ extrinsic:
30
+ gamma: 0.99
31
+ strength: 1.0
32
+ network_settings:
33
+ normalize: false
34
+ hidden_units: 128
35
+ num_layers: 2
36
+ vis_encode_type: simple
37
+ memory: null
38
+ goal_conditioning_type: hyper
39
+ deterministic: false
40
+ curiosity:
41
+ gamma: 0.995
42
+ strength: 0.1
43
+ network_settings:
44
+ normalize: true
45
+ hidden_units: 256
46
+ num_layers: 4
47
+ vis_encode_type: simple
48
+ memory: null
49
+ goal_conditioning_type: hyper
50
+ deterministic: false
51
+ learning_rate: 0.0003
52
+ encoding_size: null
53
+ init_path: null
54
+ keep_checkpoints: 10
55
+ even_checkpoints: false
56
+ max_steps: 2000000
57
+ time_horizon: 256
58
+ summary_freq: 10000
59
+ threaded: true
60
+ self_play: null
61
+ behavioral_cloning: null
62
+ env_settings:
63
+ env_path: .\Build
64
+ env_args: null
65
+ base_port: 5005
66
+ num_envs: 1
67
+ num_areas: 1
68
+ timeout_wait: 300
69
+ seed: -1
70
+ max_lifetime_restarts: 10
71
+ restarts_rate_limit_n: 1
72
+ restarts_rate_limit_period_s: 60
73
+ engine_settings:
74
+ width: 84
75
+ height: 84
76
+ quality_level: 5
77
+ time_scale: 20
78
+ target_frame_rate: -1
79
+ capture_frame_rate: 60
80
+ no_graphics: false
81
+ environment_parameters: null
82
+ checkpoint_settings:
83
+ run_id: tau_agent_ppo_A2
84
+ initialize_from: null
85
+ load_model: false
86
+ resume: false
87
+ force: true
88
+ train_model: false
89
+ inference: false
90
+ results_dir: results
91
+ torch_settings:
92
+ device: cuda
93
+ debug: false
results/tau_agent_ppo_A3_2M/Tau-A3-PPO-1M.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4415d030673efd5e6692cbfbac1618956704cea501fda3c152b3308e875a94e4
3
+ size 2186395
results/tau_agent_ppo_A3_2M/TauAgent/TauAgent-1199856.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:033766d0894fd21885177d13966ff23817ba7843978f6bcc24cb1a4352983f64
3
+ size 2186395