pushing model
Browse files
- README.md +1 -1
- events.out.tfevents.1668621727.pop-os.1063627.0 +3 -0
- events.out.tfevents.1668621728.pop-os.1063627.1 +3 -0
- pyproject.toml +96 -0
- replay.mp4 +0 -0
- videos/CartPole-v1__dqn__1__1668621727-eval/rl-video-episode-0.mp4 +0 -0
- videos/CartPole-v1__dqn__1__1668621727-eval/rl-video-episode-1.mp4 +0 -0
- videos/CartPole-v1__dqn__1__1668621727-eval/rl-video-episode-8.mp4 +0 -0
README.md
CHANGED
@@ -30,7 +30,7 @@ found [here](https://github.com/vwxyzjn/cleanrl/blob/master/cleanrl/dqn.py).
|
|
30 |
|
31 |
```bash
|
32 |
curl -OL https://huggingface.co/vwxyzjn/CartPole-v1-dqn-seed1/raw/main/dqn.py
|
33 |
-
python
|
34 |
```
|
35 |
|
36 |
# Hyperparameters
|
|
|
30 |
|
31 |
```bash
|
32 |
curl -OL https://huggingface.co/vwxyzjn/CartPole-v1-dqn-seed1/raw/main/dqn.py
|
33 |
+
python dqn.py --cuda False --save-model --upload-model --total-timesteps 500
|
34 |
```
|
35 |
|
36 |
# Hyperparameters
|
events.out.tfevents.1668621727.pop-os.1063627.0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:830b02670954a8f05f7e96b7966dd827f8bd7206f70e7ef00bb70a9b1e1c447a
|
3 |
+
size 1805
|
events.out.tfevents.1668621728.pop-os.1063627.1
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a4c417780d8220d5655af10b0d08bf71d9ea42beb2b1087f355555cd052abbe6
|
3 |
+
size 618
|
pyproject.toml
ADDED
@@ -0,0 +1,96 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
[tool.poetry]
|
2 |
+
name = "cleanrl"
|
3 |
+
version = "1.0.0b2"
|
4 |
+
description = "High-quality single file implementation of Deep Reinforcement Learning algorithms with research-friendly features"
|
5 |
+
authors = ["Costa Huang <[email protected]>"]
|
6 |
+
include = ["cleanrl_utils"]
|
7 |
+
keywords = ["reinforcement", "machine", "learning", "research"]
|
8 |
+
license="MIT"
|
9 |
+
readme = "README.md"
|
10 |
+
|
11 |
+
[tool.poetry.dependencies]
|
12 |
+
python = ">=3.7.1,<3.10"
|
13 |
+
tensorboard = "^2.10.0"
|
14 |
+
wandb = "^0.13.3"
|
15 |
+
gym = {version = "0.23.1", extras = ["classic_control"]}
|
16 |
+
torch = "^1.12.1"
|
17 |
+
stable-baselines3 = "1.2.0"
|
18 |
+
|
19 |
+
[tool.poetry.group.dev.dependencies]
|
20 |
+
pre-commit = "^2.20.0"
|
21 |
+
|
22 |
+
[tool.poetry.group.atari]
|
23 |
+
optional = true
|
24 |
+
[tool.poetry.group.atari.dependencies]
|
25 |
+
ale-py = "0.7.4"
|
26 |
+
AutoROM = {extras = ["accept-rom-license"], version = "^0.4.2"}
|
27 |
+
opencv-python = "^4.6.0.66"
|
28 |
+
|
29 |
+
[tool.poetry.group.pybullet]
|
30 |
+
optional = true
|
31 |
+
[tool.poetry.group.pybullet.dependencies]
|
32 |
+
pybullet = "3.1.8"
|
33 |
+
|
34 |
+
[tool.poetry.group.procgen]
|
35 |
+
optional = true
|
36 |
+
[tool.poetry.group.procgen.dependencies]
|
37 |
+
procgen = "^0.10.7"
|
38 |
+
|
39 |
+
[tool.poetry.group.pytest]
|
40 |
+
optional = true
|
41 |
+
[tool.poetry.group.pytest.dependencies]
|
42 |
+
pytest = "^7.1.3"
|
43 |
+
|
44 |
+
[tool.poetry.group.mujoco]
|
45 |
+
optional = true
|
46 |
+
[tool.poetry.group.mujoco.dependencies]
|
47 |
+
free-mujoco-py = "^2.1.6"
|
48 |
+
|
49 |
+
[tool.poetry.group.docs]
|
50 |
+
optional = true
|
51 |
+
[tool.poetry.group.docs.dependencies]
|
52 |
+
mkdocs-material = "^8.4.3"
|
53 |
+
markdown-include = "^0.7.0"
|
54 |
+
|
55 |
+
[tool.poetry.group.jax]
|
56 |
+
optional = true
|
57 |
+
[tool.poetry.group.jax.dependencies]
|
58 |
+
jax = "^0.3.17"
|
59 |
+
jaxlib = "^0.3.15"
|
60 |
+
flax = "^0.6.0"
|
61 |
+
|
62 |
+
[tool.poetry.group.optuna]
|
63 |
+
optional = true
|
64 |
+
[tool.poetry.group.optuna.dependencies]
|
65 |
+
optuna = "^3.0.1"
|
66 |
+
optuna-dashboard = "^0.7.2"
|
67 |
+
rich = "<12.0"
|
68 |
+
|
69 |
+
[tool.poetry.group.envpool]
|
70 |
+
optional = true
|
71 |
+
[tool.poetry.group.envpool.dependencies]
|
72 |
+
envpool = "^0.6.4"
|
73 |
+
|
74 |
+
[tool.poetry.group.pettingzoo]
|
75 |
+
optional = true
|
76 |
+
[tool.poetry.group.pettingzoo.dependencies]
|
77 |
+
PettingZoo = "1.18.1"
|
78 |
+
SuperSuit = "3.4.0"
|
79 |
+
multi-agent-ale-py = "0.1.11"
|
80 |
+
|
81 |
+
|
82 |
+
[tool.poetry.group.cloud]
|
83 |
+
optional = true
|
84 |
+
[tool.poetry.group.cloud.dependencies]
|
85 |
+
boto3 = "^1.24.70"
|
86 |
+
awscli = "^1.25.71"
|
87 |
+
|
88 |
+
[tool.poetry.group.isaacgym]
|
89 |
+
optional = true
|
90 |
+
[tool.poetry.group.isaacgym.dependencies]
|
91 |
+
isaacgymenvs = {git = "https://github.com/vwxyzjn/IsaacGymEnvs.git", rev = "poetry"}
|
92 |
+
isaacgym = {path = "cleanrl/ppo_continuous_action_isaacgym/isaacgym", develop = true}
|
93 |
+
|
94 |
+
[build-system]
|
95 |
+
requires = ["poetry-core"]
|
96 |
+
build-backend = "poetry.core.masonry.api"
|
replay.mp4
ADDED
Binary file (10.8 kB). View file
|
|
videos/CartPole-v1__dqn__1__1668621727-eval/rl-video-episode-0.mp4
ADDED
Binary file (12.6 kB). View file
|
|
videos/CartPole-v1__dqn__1__1668621727-eval/rl-video-episode-1.mp4
ADDED
Binary file (8.84 kB). View file
|
|
videos/CartPole-v1__dqn__1__1668621727-eval/rl-video-episode-8.mp4
ADDED
Binary file (10.8 kB). View file
|
|