DContrerasF committed on
Commit
c530019
1 Parent(s): 78c3dcc

Push agent to the Hub

Browse files
README.md ADDED
@@ -0,0 +1,61 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ ---
2
+ tags:
3
+ - CartPole-v1
4
+ - ppo
5
+ - deep-reinforcement-learning
6
+ - reinforcement-learning
7
+ - custom-implementation
8
+ - deep-rl-course
9
+ model-index:
10
+ - name: PPO
11
+ results:
12
+ - task:
13
+ type: reinforcement-learning
14
+ name: reinforcement-learning
15
+ dataset:
16
+ name: CartPole-v1
17
+ type: CartPole-v1
18
+ metrics:
19
+ - type: mean_reward
20
+ value: 142.50 +/- 54.68
21
+ name: mean_reward
22
+ verified: false
23
+ ---
24
+
25
+ # PPO Agent Playing CartPole-v1
26
+
27
+ This is a trained model of a PPO agent playing CartPole-v1.
28
+
29
+ # Hyperparameters
30
+ ```python
31
+ {'repo_id': 'DContrerasF/ppo-own-CartPole-v1',
32
+ 'exp_name': 'ppo',
33
+ 'gym_id': 'CartPole-v1',
34
+ 'learning_rate': 0.00025,
35
+ 'seed': 1,
36
+ 'total_timesteps': 25000,
37
+ 'torch_deterministic': True,
38
+ 'cuda': True,
39
+ 'track': False,
40
+ 'wandb_project_name': 'DeepRL',
41
+ 'wandb_entity': None,
42
+ 'capture_video': False,
43
+ 'num_envs': 4,
44
+ 'num_steps': 128,
45
+ 'anneal_lr': True,
46
+ 'gae': True,
47
+ 'gamma': 0.99,
48
+ 'gae_lambda': 0.95,
49
+ 'num_minibatches': 4,
50
+ 'update_epochs': 4,
51
+ 'norm_adv': True,
52
+ 'clip_coef': 0.2,
53
+ 'clip_vloss': True,
54
+ 'ent_coef': 0.01,
55
+ 'vf_coef': 0.5,
56
+ 'max_grad_norm': 0.5,
57
+ 'target_kl': None,
58
+ 'batch_size': 512,
59
+ 'minibatch_size': 128}
60
+ ```
61
+
logs/events.out.tfevents.1700240223.dl-workstation.3760873.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:baa0180f3b7d99b2dc2b66904cb741af10525166c49d0bf4d3f0c85d472339df
3
+ size 126518
logs/events.out.tfevents.1700240494.dl-workstation.3763087.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:153de31d56cef06a072efa189075322267549bc6f952008113e53a4ec73fbba9
3
+ size 53466
logs/events.out.tfevents.1700240531.dl-workstation.3763505.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a26f173c3249b79d45f1bd6422f4b10d8e3fc34660c0c405e0a37ff4fe6a4bdf
3
+ size 46319
logs/events.out.tfevents.1700240575.dl-workstation.3764013.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:eea7109fbd6954884582a2cb5781b7bcf2c19e354856ed568be48c619f6b3754
3
+ size 52117
logs/events.out.tfevents.1700240649.dl-workstation.3764836.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:831e5edf37b5b9b652cc5ff992934dc4cbd816d97f903b8689228897d49cd2b9
3
+ size 54569
logs/events.out.tfevents.1700240933.dl-workstation.3767278.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8fcdd0acacb29b00bd2f3e763cff984f05cde285ec08efdfd1b4f5544c568e8d
3
+ size 51235
logs/events.out.tfevents.1700241374.dl-workstation.3770717.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:14a7a0e687de0f8bd28ef6a6e1ebab15343020e28c3258dc55111143ce69fd25
3
+ size 3568
logs/events.out.tfevents.1700241405.dl-workstation.3771104.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:21bbd1fb3df2ad90451758af3452e9cbcff0d4460a4ea16852bf746e68cd8ffb
3
+ size 3568
logs/events.out.tfevents.1700241414.dl-workstation.3771346.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:56776bd85ede565feeefa0465e3231e23f1fd9e995802b1eb7d1a603a424fb5f
3
+ size 3568
logs/events.out.tfevents.1700241428.dl-workstation.3771637.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c82235984ad8d2afd8437bea6ad97c69a676b2b47643a0f9ba924b7da1ef38c0
3
+ size 3568
logs/events.out.tfevents.1700241470.dl-workstation.3772096.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f58e305ed79651761004a1940ba2d6aeacbfcddc6b2474de756b1493975760a5
3
+ size 76770
logs/events.out.tfevents.1700241776.dl-workstation.3774646.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c788b28096dc7fc0473f046276c6532be20df5d16fe58c4397e32161b30d009e
3
+ size 82064
logs/events.out.tfevents.1700241906.dl-workstation.3775956.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f856e4dae1993f2fcfec69f2f970c1d4530b0b8bc2e43ebc3bf720e30714f6ca
3
+ size 75179
logs/events.out.tfevents.1700241950.dl-workstation.3776419.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:12d67424618004cf159d0087d401022aa5654b43f58de6ae319e00761b4b7f07
3
+ size 73803
logs/events.out.tfevents.1700242010.dl-workstation.3776961.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d5cd4c79009c4cc6861712abfe0ea6a78af20124b65ad1417b8248f88f4516cb
3
+ size 73823
logs/events.out.tfevents.1700242037.dl-workstation.3777282.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:068df2e7cf6487b74e9c0f805e3b66cf5aba4b13d94b3631980c7f8f1e2ce00c
3
+ size 73085
logs/events.out.tfevents.1700242096.dl-workstation.3778070.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:57a39629e79533b60e41da6fa1ac40e77247890e8c54c4f26edd814991e93cc6
3
+ size 71633
model.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:37b6cc041d7f4ae4a726cb3b4a58b05b5eed60afc86b6850d6c843718cbc9248
3
+ size 40466
replay.mp4 ADDED
Binary file (10.8 kB). View file
 
results.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"env_id": "CartPole-v1", "mean_reward": 142.5, "std_reward": 54.675863047600814, "n_evaluation_episodes": 10, "eval_datetime": "2023-11-17T17:28:29.318552"}