Sekiraw committed on
Commit
453c253
·
1 Parent(s): e5b71bd

Upload 11 files

Browse files
.gitattributes CHANGED
@@ -2,34 +2,27 @@
2
  *.arrow filter=lfs diff=lfs merge=lfs -text
3
  *.bin filter=lfs diff=lfs merge=lfs -text
4
  *.bz2 filter=lfs diff=lfs merge=lfs -text
5
- *.ckpt filter=lfs diff=lfs merge=lfs -text
6
  *.ftz filter=lfs diff=lfs merge=lfs -text
7
  *.gz filter=lfs diff=lfs merge=lfs -text
8
  *.h5 filter=lfs diff=lfs merge=lfs -text
9
  *.joblib filter=lfs diff=lfs merge=lfs -text
10
  *.lfs.* filter=lfs diff=lfs merge=lfs -text
11
- *.mlmodel filter=lfs diff=lfs merge=lfs -text
12
  *.model filter=lfs diff=lfs merge=lfs -text
13
  *.msgpack filter=lfs diff=lfs merge=lfs -text
14
- *.npy filter=lfs diff=lfs merge=lfs -text
15
- *.npz filter=lfs diff=lfs merge=lfs -text
16
  *.onnx filter=lfs diff=lfs merge=lfs -text
17
  *.ot filter=lfs diff=lfs merge=lfs -text
18
  *.parquet filter=lfs diff=lfs merge=lfs -text
19
  *.pb filter=lfs diff=lfs merge=lfs -text
20
- *.pickle filter=lfs diff=lfs merge=lfs -text
21
- *.pkl filter=lfs diff=lfs merge=lfs -text
22
  *.pt filter=lfs diff=lfs merge=lfs -text
23
  *.pth filter=lfs diff=lfs merge=lfs -text
24
  *.rar filter=lfs diff=lfs merge=lfs -text
25
- *.safetensors filter=lfs diff=lfs merge=lfs -text
26
  saved_model/**/* filter=lfs diff=lfs merge=lfs -text
27
  *.tar.* filter=lfs diff=lfs merge=lfs -text
28
- *.tar filter=lfs diff=lfs merge=lfs -text
29
  *.tflite filter=lfs diff=lfs merge=lfs -text
30
  *.tgz filter=lfs diff=lfs merge=lfs -text
31
  *.wasm filter=lfs diff=lfs merge=lfs -text
32
  *.xz filter=lfs diff=lfs merge=lfs -text
33
  *.zip filter=lfs diff=lfs merge=lfs -text
34
- *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
 
 
2
  *.arrow filter=lfs diff=lfs merge=lfs -text
3
  *.bin filter=lfs diff=lfs merge=lfs -text
4
  *.bz2 filter=lfs diff=lfs merge=lfs -text
 
5
  *.ftz filter=lfs diff=lfs merge=lfs -text
6
  *.gz filter=lfs diff=lfs merge=lfs -text
7
  *.h5 filter=lfs diff=lfs merge=lfs -text
8
  *.joblib filter=lfs diff=lfs merge=lfs -text
9
  *.lfs.* filter=lfs diff=lfs merge=lfs -text
 
10
  *.model filter=lfs diff=lfs merge=lfs -text
11
  *.msgpack filter=lfs diff=lfs merge=lfs -text
 
 
12
  *.onnx filter=lfs diff=lfs merge=lfs -text
13
  *.ot filter=lfs diff=lfs merge=lfs -text
14
  *.parquet filter=lfs diff=lfs merge=lfs -text
15
  *.pb filter=lfs diff=lfs merge=lfs -text
 
 
16
  *.pt filter=lfs diff=lfs merge=lfs -text
17
  *.pth filter=lfs diff=lfs merge=lfs -text
18
  *.rar filter=lfs diff=lfs merge=lfs -text
 
19
  saved_model/**/* filter=lfs diff=lfs merge=lfs -text
20
  *.tar.* filter=lfs diff=lfs merge=lfs -text
 
21
  *.tflite filter=lfs diff=lfs merge=lfs -text
22
  *.tgz filter=lfs diff=lfs merge=lfs -text
23
  *.wasm filter=lfs diff=lfs merge=lfs -text
24
  *.xz filter=lfs diff=lfs merge=lfs -text
25
  *.zip filter=lfs diff=lfs merge=lfs -text
26
+ *.zstandard filter=lfs diff=lfs merge=lfs -text
27
  *tfevents* filter=lfs diff=lfs merge=lfs -text
28
+ *.mp4 filter=lfs diff=lfs merge=lfs -text
README.md CHANGED
@@ -1,27 +1,28 @@
1
  ---
 
2
  tags:
3
- - doom_health_gathering_supreme
4
- - reinforce
5
  - reinforcement-learning
6
- - custom-implementation
7
- - deep-rl-class
8
  model-index:
9
- - name: doom_health_gathering_supreme
10
  results:
11
- - task:
 
 
 
 
12
  type: reinforcement-learning
13
  name: reinforcement-learning
14
  dataset:
15
- name: doom_health_gathering_supreme
16
- type: doom_health_gathering_supreme
17
- metrics:
18
- - type: mean_reward
19
- value: 6
20
- name: mean_reward
21
- verified: false
22
  ---
23
 
24
- # **Reinforce** Agent playing **Pixelcopter-PLE-v0**
25
- This is a trained model of a **Reinforce** agent playing **Pixelcopter-PLE-v0** .
26
- To learn to use this model and train yours check Unit 4 of the Deep Reinforcement Learning Course: https://huggingface.co/deep-rl-course/unit4/introduction
 
 
27
 
 
1
  ---
2
+ library_name: stable-baselines3
3
  tags:
4
+ - VizdoomBasic-v0
5
+ - deep-reinforcement-learning
6
  - reinforcement-learning
7
+ - stable-baselines3
 
8
  model-index:
9
+ - name: ppo
10
  results:
11
+ - metrics:
12
+ - type: mean_reward
13
+ value: -209.90 +/- 196.26
14
+ name: mean_reward
15
+ task:
16
  type: reinforcement-learning
17
  name: reinforcement-learning
18
  dataset:
19
+ name: VizdoomBasic-v0
20
+ type: VizdoomBasic-v0
 
 
 
 
 
21
  ---
22
 
23
+ # **ppo** Agent playing **VizdoomBasic-v0**
24
+ This is a trained model of a **ppo** agent playing **VizdoomBasic-v0** using the [stable-baselines3 library](https://github.com/DLR-RM/stable-baselines3).
25
+
26
+ ## Usage (with Stable-Baselines3)
27
+ TODO: Add a code snippet showing how to load and run this model.
28
 
config.json ADDED
The diff for this file is too large to render. See raw diff
 
ppo-Doom.zip ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:03dcbe57ae05a5bb3660cff7d98df4461504b5639c0080939221b7893b511607
3
+ size 133
ppo-Doom/_stable_baselines3_version ADDED
@@ -0,0 +1 @@
 
 
1
+ 1.5.0
ppo-Doom/data ADDED
The diff for this file is too large to render. See raw diff
 
ppo-Doom/policy.optimizer.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2ff81d30317e0be4a5f36a08bc9c3c0f1a877d7b7a9fecf3c9302e23f0471f43
3
+ size 132
ppo-Doom/policy.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f5144f904b79de40add8c3bd92bc91d4416f2af5ca62a2df0944a82eae4abfdc
3
+ size 132
ppo-Doom/pytorch_variables.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:99153ed9b545f0f5af916841c8510b36c9a0a84e88f412678bced8aba994b482
3
+ size 128
ppo-Doom/system_info.txt ADDED
@@ -0,0 +1,7 @@
 
 
 
 
 
 
 
 
1
+ OS: Linux-5.13.0-44-generic-x86_64-with-glibc2.17 #49~20.04.1-Ubuntu SMP Wed May 18 18:44:28 UTC 2022
2
+ Python: 3.8.12
3
+ Stable-Baselines3: 1.5.0
4
+ PyTorch: 1.10.2+cu102
5
+ GPU Enabled: False
6
+ Numpy: 1.22.2
7
+ Gym: 0.23.0
results.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"mean_reward": -209.9, "std_reward": 196.25771322421951, "is_deterministic": true, "n_eval_episodes": 10, "eval_datetime": "2022-06-10T14:05:28.186967"}