MattStammers committed on
Commit
c8b3c39
1 Parent(s): fe999d8

Initial commit

Browse files
README.md CHANGED
@@ -16,7 +16,7 @@ model-index:
16
  type: BreakoutNoFrameskip-v4
17
  metrics:
18
  - type: mean_reward
19
- value: 574.30 +/- 179.99
20
  name: mean_reward
21
  verified: false
22
  ---
 
16
  type: BreakoutNoFrameskip-v4
17
  metrics:
18
  - type: mean_reward
19
+ value: 488.40 +/- 209.36
20
  name: mean_reward
21
  verified: false
22
  ---
ppo-BreakoutNoFrameskip-v4.zip CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:ae451631e4077aea9d92d8a0f1da8914ab31684a526f34cef067227beb0538a3
3
- size 20425207
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9161db146af8f42d06cb0ce72412df424a5d3f973e6c0a11d114edaa730dc2fa
3
+ size 20425210
ppo-BreakoutNoFrameskip-v4/data CHANGED
The diff for this file is too large to render. See raw diff
 
ppo-BreakoutNoFrameskip-v4/policy.optimizer.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:d1ed6dc80e773e710e9bc696e554604099657e6c76e164a2f02c9a6cf1b07030
3
  size 13502841
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2bfcc3567da90372b5e46b4da0c43a54aa379c912a79c48ee2a6c6eeeeec05d5
3
  size 13502841
ppo-BreakoutNoFrameskip-v4/policy.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:8cb3d29db66a183879de56c028f73db34dce80e7a3be49004586e89a3a5b0107
3
  size 6753345
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:eb274df75cbcd6d2f3aac9e7a5dc58a00b8edc4efbb2067071c6267a5f6da61c
3
  size 6753345
replay.mp4 CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:8bb06b4db1a387b05e0bb792236b69d92c5d00d198d9bf39871cc71175a50a32
3
- size 783638
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4b84c9e0b644cf444ecbb46d5121264da69c2e4eda7cdcd633fa4b2ddf96e574
3
+ size 83106
results.json CHANGED
@@ -1 +1 @@
1
- {"mean_reward": 574.3, "std_reward": 179.99447213734092, "is_deterministic": false, "n_eval_episodes": 10, "eval_datetime": "2023-09-06T16:48:39.451486"}
 
1
+ {"mean_reward": 488.4, "std_reward": 209.35720670662377, "is_deterministic": false, "n_eval_episodes": 10, "eval_datetime": "2023-09-11T20:33:45.283863"}
train_eval_metrics.zip CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:52affd2d64995dd6554573b76132da5f96a8a633da2b94d8d41cadbf6cdf998a
3
- size 882777
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8f32ac0d59a31c8804653d806133977507ee96e2a5ece7c3aede30f76d028051
3
+ size 1229031