MattStammers committed on
Commit
78f7a65
1 Parent(s): 9a48df1

Initial commit

Browse files
README.md CHANGED
@@ -16,7 +16,7 @@ model-index:
16
  type: BreakoutNoFrameskip-v4
17
  metrics:
18
  - type: mean_reward
19
- value: 472.40 +/- 113.77
20
  name: mean_reward
21
  verified: false
22
  ---
 
16
  type: BreakoutNoFrameskip-v4
17
  metrics:
18
  - type: mean_reward
19
+ value: 574.30 +/- 179.99
20
  name: mean_reward
21
  verified: false
22
  ---
ppo-BreakoutNoFrameskip-v4.zip CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:963780344b17f59a767b8bac2cb3f4d2ef0427596a6957b30b8ba04cbc28a0a9
3
  size 20425207
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ae451631e4077aea9d92d8a0f1da8914ab31684a526f34cef067227beb0538a3
3
  size 20425207
ppo-BreakoutNoFrameskip-v4/data CHANGED
The diff for this file is too large to render. See raw diff
 
ppo-BreakoutNoFrameskip-v4/policy.optimizer.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:e02e5a6e6ede9837baf29a0f74bddff2317a4e9b7a77c09b95a59b14821ee0e8
3
  size 13502841
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d1ed6dc80e773e710e9bc696e554604099657e6c76e164a2f02c9a6cf1b07030
3
  size 13502841
ppo-BreakoutNoFrameskip-v4/policy.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:d31f6dac049c0d0fca351fa5b8cd2d1b525b93f0ab8568978ccd8b06592b047b
3
  size 6753345
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8cb3d29db66a183879de56c028f73db34dce80e7a3be49004586e89a3a5b0107
3
  size 6753345
replay.mp4 CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:2ce440f439c4baf4bc9e5030d17977d8506b2a61d73944d3787ee8327684a887
3
- size 80488
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:192413b341f00c180aec2f9e9abb2c419a1cdb20fb6b2c1ac19c37f790a0e722
3
+ size 74522
results.json CHANGED
@@ -1 +1 @@
1
- {"mean_reward": 472.4, "std_reward": 113.7718770171258, "is_deterministic": false, "n_eval_episodes": 10, "eval_datetime": "2023-09-06T07:49:22.187719"}
 
1
+ {"mean_reward": 574.3, "std_reward": 179.99447213734092, "is_deterministic": false, "n_eval_episodes": 10, "eval_datetime": "2023-09-06T16:48:39.451486"}
train_eval_metrics.zip CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:3de41f1eb3a0bc03b20c8813a78d20aedc6962404980c751dfdf744dc0986a61
3
- size 807724
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:52affd2d64995dd6554573b76132da5f96a8a633da2b94d8d41cadbf6cdf998a
3
+ size 882777