AdiKompella committed on
Commit
f1babf1
·
1 Parent(s): 212632d

Initial commit

Browse files
README.md CHANGED
@@ -8,16 +8,17 @@ tags:
8
  model-index:
9
  - name: DQN
10
  results:
11
- - metrics:
12
- - type: mean_reward
13
- value: 483.50 +/- 180.71
14
- name: mean_reward
15
- task:
16
  type: reinforcement-learning
17
  name: reinforcement-learning
18
  dataset:
19
  name: SpaceInvadersNoFrameskip-v4
20
  type: SpaceInvadersNoFrameskip-v4
 
 
 
 
 
21
  ---
22
 
23
  # **DQN** Agent playing **SpaceInvadersNoFrameskip-v4**
@@ -37,20 +38,26 @@ SB3 Contrib: https://github.com/Stable-Baselines-Team/stable-baselines3-contrib
37
 
38
  ```
39
  # Download model and save it into the logs/ folder
40
- python -m utils.load_from_hub --algo dqn --env SpaceInvadersNoFrameskip-v4 -orga AdiKompella -f logs/
41
  python enjoy.py --algo dqn --env SpaceInvadersNoFrameskip-v4 -f logs/
42
  ```
43
 
 
 
 
 
 
 
44
  ## Training (with the RL Zoo)
45
  ```
46
  python train.py --algo dqn --env SpaceInvadersNoFrameskip-v4 -f logs/
47
  # Upload the model and generate video (when possible)
48
- python -m utils.push_to_hub --algo dqn --env SpaceInvadersNoFrameskip-v4 -f logs/ -orga AdiKompella
49
  ```
50
 
51
  ## Hyperparameters
52
  ```python
53
- OrderedDict([('batch_size', 32),
54
  ('buffer_size', 100000),
55
  ('env_wrapper',
56
  ['stable_baselines3.common.atari_wrappers.AtariWrapper']),
@@ -61,7 +68,7 @@ OrderedDict([('batch_size', 32),
61
  ('learning_rate', 0.0001),
62
  ('learning_starts', 100000),
63
  ('n_timesteps', 1000000.0),
64
- ('optimize_memory_usage', True),
65
  ('policy', 'CnnPolicy'),
66
  ('target_update_interval', 1000),
67
  ('train_freq', 4),
 
8
  model-index:
9
  - name: DQN
10
  results:
11
+ - task:
 
 
 
 
12
  type: reinforcement-learning
13
  name: reinforcement-learning
14
  dataset:
15
  name: SpaceInvadersNoFrameskip-v4
16
  type: SpaceInvadersNoFrameskip-v4
17
+ metrics:
18
+ - type: mean_reward
19
+ value: 395.50 +/- 156.84
20
+ name: mean_reward
21
+ verified: false
22
  ---
23
 
24
  # **DQN** Agent playing **SpaceInvadersNoFrameskip-v4**
 
38
 
39
  ```
40
  # Download model and save it into the logs/ folder
41
+ python -m rl_zoo3.load_from_hub --algo dqn --env SpaceInvadersNoFrameskip-v4 -orga AdiKompella -f logs/
42
  python enjoy.py --algo dqn --env SpaceInvadersNoFrameskip-v4 -f logs/
43
  ```
44
 
45
+ If you installed the RL Zoo3 via pip (`pip install rl_zoo3`), from anywhere you can do:
46
+ ```
47
+ python -m rl_zoo3.load_from_hub --algo dqn --env SpaceInvadersNoFrameskip-v4 -orga AdiKompella -f logs/
48
+ rl_zoo3 enjoy --algo dqn --env SpaceInvadersNoFrameskip-v4 -f logs/
49
+ ```
50
+
51
  ## Training (with the RL Zoo)
52
  ```
53
  python train.py --algo dqn --env SpaceInvadersNoFrameskip-v4 -f logs/
54
  # Upload the model and generate video (when possible)
55
+ python -m rl_zoo3.push_to_hub --algo dqn --env SpaceInvadersNoFrameskip-v4 -f logs/ -orga AdiKompella
56
  ```
57
 
58
  ## Hyperparameters
59
  ```python
60
+ OrderedDict([('batch_size', 64),
61
  ('buffer_size', 100000),
62
  ('env_wrapper',
63
  ['stable_baselines3.common.atari_wrappers.AtariWrapper']),
 
68
  ('learning_rate', 0.0001),
69
  ('learning_starts', 100000),
70
  ('n_timesteps', 1000000.0),
71
+ ('optimize_memory_usage', False),
72
  ('policy', 'CnnPolicy'),
73
  ('target_update_interval', 1000),
74
  ('train_freq', 4),
args.yml CHANGED
@@ -1,6 +1,8 @@
1
  !!python/object/apply:collections.OrderedDict
2
  - - - algo
3
  - dqn
 
 
4
  - - device
5
  - auto
6
  - - env
@@ -41,6 +43,8 @@
41
  - null
42
  - - optimize_hyperparameters
43
  - false
 
 
44
  - - pruner
45
  - median
46
  - - sampler
@@ -50,7 +54,7 @@
50
  - - save_replay_buffer
51
  - false
52
  - - seed
53
- - 3785032319
54
  - - storage
55
  - null
56
  - - study_name
@@ -73,3 +77,5 @@
73
  - null
74
  - - wandb_project_name
75
  - sb3
 
 
 
1
  !!python/object/apply:collections.OrderedDict
2
  - - - algo
3
  - dqn
4
+ - - conf_file
5
+ - null
6
  - - device
7
  - auto
8
  - - env
 
43
  - null
44
  - - optimize_hyperparameters
45
  - false
46
+ - - progress
47
+ - false
48
  - - pruner
49
  - median
50
  - - sampler
 
54
  - - save_replay_buffer
55
  - false
56
  - - seed
57
+ - 1833769000
58
  - - storage
59
  - null
60
  - - study_name
 
77
  - null
78
  - - wandb_project_name
79
  - sb3
80
+ - - yaml_file
81
+ - null
config.yml CHANGED
@@ -1,6 +1,6 @@
1
  !!python/object/apply:collections.OrderedDict
2
  - - - batch_size
3
- - 32
4
  - - buffer_size
5
  - 100000
6
  - - env_wrapper
@@ -20,7 +20,7 @@
20
  - - n_timesteps
21
  - 1000000.0
22
  - - optimize_memory_usage
23
- - true
24
  - - policy
25
  - CnnPolicy
26
  - - target_update_interval
 
1
  !!python/object/apply:collections.OrderedDict
2
  - - - batch_size
3
+ - 64
4
  - - buffer_size
5
  - 100000
6
  - - env_wrapper
 
20
  - - n_timesteps
21
  - 1000000.0
22
  - - optimize_memory_usage
23
+ - false
24
  - - policy
25
  - CnnPolicy
26
  - - target_update_interval
dqn-SpaceInvadersNoFrameskip-v4.zip CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:1dea494b1b77497c94312d1562d3d5412d86b57aabc78309ed8ccf7b1be52a62
3
- size 27222203
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6f81d1a234d4fc397a5cdbefa9e9195e4d22c6338f6e2eee0c7799b0d51a6b8d
3
+ size 27224794
dqn-SpaceInvadersNoFrameskip-v4/_stable_baselines3_version CHANGED
@@ -1 +1 @@
1
- 1.5.1a8
 
1
+ 1.7.0a10
dqn-SpaceInvadersNoFrameskip-v4/data CHANGED
The diff for this file is too large to render. See raw diff
 
dqn-SpaceInvadersNoFrameskip-v4/policy.optimizer.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:9beb694283cffebfda6503ce18f7083dad85a0741dcafce3a772e6dec1758adc
3
- size 13503145
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8d80156ddb0dc200c180c51d29d03c304950d4c6ff5f5e7703bf700bebb24c62
3
+ size 13505739
dqn-SpaceInvadersNoFrameskip-v4/policy.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:397402417cc7b0381c998d0d96a630b28d266a05938794a6b2e187bc0eace245
3
  size 13504937
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5015934598d25e06bb579fcdeaae5f740bd67d748bfc1359a867d34b35dd861c
3
  size 13504937
dqn-SpaceInvadersNoFrameskip-v4/system_info.txt CHANGED
@@ -1,7 +1,7 @@
1
- OS: Linux-5.4.188+-x86_64-with-Ubuntu-18.04-bionic #1 SMP Sun Apr 24 10:03:06 PDT 2022
2
- Python: 3.7.13
3
- Stable-Baselines3: 1.5.1a8
4
- PyTorch: 1.11.0+cu113
5
  GPU Enabled: True
6
  Numpy: 1.21.6
7
  Gym: 0.21.0
 
1
+ OS: Linux-5.10.133+-x86_64-with-glibc2.27 #1 SMP Fri Aug 26 08:44:51 UTC 2022
2
+ Python: 3.8.16
3
+ Stable-Baselines3: 1.7.0a10
4
+ PyTorch: 1.13.0+cu116
5
  GPU Enabled: True
6
  Numpy: 1.21.6
7
  Gym: 0.21.0
replay.mp4 CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:2bd8591ca786dff6946ac73131701efc91cbc3db84eb5af6ddea5f12d5b67bc7
3
- size 188033
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:44f33f5ab6ed5e761385e87426e2edef0d996ab375df8cd7e5925479ee3028d4
3
+ size 219303
results.json CHANGED
@@ -1 +1 @@
1
- {"mean_reward": 483.5, "std_reward": 180.70763680597452, "is_deterministic": false, "n_eval_episodes": 10, "eval_datetime": "2022-06-28T23:05:38.427677"}
 
1
+ {"mean_reward": 395.5, "std_reward": 156.83510448875916, "is_deterministic": false, "n_eval_episodes": 10, "eval_datetime": "2022-12-27T00:17:04.511357"}
train_eval_metrics.zip CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:645878abe0df26c0c0ab326fbdb0c345c0b2ff311074fb5fedb6b9349b031d55
3
- size 36404
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:aaceefd27196fd4c2feb43e060a07049716a7e17b0d830edc93f49cfae51dc55
3
+ size 36613