Upload 54 files
Browse files
This view is limited to 50 files because it contains too many changes.
See raw diff
- lr/config/agent/lr.yaml +59 -0
- lr/config/env/lr.yaml +7 -0
- lr/config/trainer.yaml +105 -0
- lr/config/world_model_env/default.yaml +27 -0
- lr/config/world_model_env/fast.yaml +27 -0
- lr/model/lr.pt +3 -0
- lr/spawn/0/act.npy +3 -0
- lr/spawn/0/full_res.npy +3 -0
- lr/spawn/0/full_res_0.png +0 -0
- lr/spawn/0/full_res_1.png +0 -0
- lr/spawn/0/full_res_2.png +0 -0
- lr/spawn/0/full_res_3.png +0 -0
- lr/spawn/0/low_res.npy +3 -0
- lr/spawn/0/next_act.npy +3 -0
- lr/spawn/1/act.npy +3 -0
- lr/spawn/1/full_res.npy +3 -0
- lr/spawn/1/full_res_0.png +0 -0
- lr/spawn/1/full_res_1.png +0 -0
- lr/spawn/1/full_res_2.png +0 -0
- lr/spawn/1/full_res_3.png +0 -0
- lr/spawn/1/low_res.npy +3 -0
- lr/spawn/1/next_act.npy +3 -0
- lr/spawn/2/act.npy +3 -0
- lr/spawn/2/full_res.npy +3 -0
- lr/spawn/2/full_res_0.png +0 -0
- lr/spawn/2/full_res_1.png +0 -0
- lr/spawn/2/full_res_2.png +0 -0
- lr/spawn/2/full_res_3.png +0 -0
- lr/spawn/2/low_res.npy +3 -0
- lr/spawn/2/next_act.npy +3 -0
- lr/spawn/3/act.npy +3 -0
- lr/spawn/3/full_res.npy +3 -0
- lr/spawn/3/full_res_0.png +0 -0
- lr/spawn/3/full_res_1.png +0 -0
- lr/spawn/3/full_res_2.png +0 -0
- lr/spawn/3/full_res_3.png +0 -0
- lr/spawn/3/low_res.npy +3 -0
- lr/spawn/3/next_act.npy +3 -0
- lr/spawn/4/act.npy +3 -0
- lr/spawn/4/full_res.npy +3 -0
- lr/spawn/4/full_res_0.png +0 -0
- lr/spawn/4/full_res_1.png +0 -0
- lr/spawn/4/full_res_2.png +0 -0
- lr/spawn/4/full_res_3.png +0 -0
- lr/spawn/4/low_res.npy +3 -0
- lr/spawn/4/next_act.npy +3 -0
- lr/spawn/5/act.npy +3 -0
- lr/spawn/5/full_res.npy +3 -0
- lr/spawn/5/full_res_0.png +0 -0
- lr/spawn/5/full_res_1.png +0 -0
lr/config/agent/lr.yaml
ADDED
@@ -0,0 +1,59 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
_target_: agent.AgentConfig
|
2 |
+
|
3 |
+
denoiser:
|
4 |
+
_target_: models.diffusion.DenoiserConfig
|
5 |
+
sigma_data: 0.5
|
6 |
+
sigma_offset_noise: 0.1
|
7 |
+
noise_previous_obs: true
|
8 |
+
upsampling_factor: null
|
9 |
+
inner_model:
|
10 |
+
_target_: models.diffusion.InnerModelConfig
|
11 |
+
img_channels: 3
|
12 |
+
num_steps_conditioning: 4
|
13 |
+
cond_channels: 2048
|
14 |
+
depths:
|
15 |
+
- 2
|
16 |
+
- 2
|
17 |
+
- 2
|
18 |
+
- 2
|
19 |
+
channels:
|
20 |
+
- 128
|
21 |
+
- 256
|
22 |
+
- 512
|
23 |
+
- 1024
|
24 |
+
attn_depths:
|
25 |
+
- 0
|
26 |
+
- 0
|
27 |
+
- 1
|
28 |
+
- 1
|
29 |
+
|
30 |
+
upsampler:
|
31 |
+
_target_: models.diffusion.DenoiserConfig
|
32 |
+
sigma_data: 0.5
|
33 |
+
sigma_offset_noise: 0.1
|
34 |
+
noise_previous_obs: false
|
35 |
+
upsampling_factor: 5
|
36 |
+
inner_model:
|
37 |
+
_target_: models.diffusion.InnerModelConfig
|
38 |
+
img_channels: 3
|
39 |
+
num_steps_conditioning: 1
|
40 |
+
cond_channels: 2048
|
41 |
+
depths:
|
42 |
+
- 2
|
43 |
+
- 2
|
44 |
+
- 2
|
45 |
+
- 2
|
46 |
+
channels:
|
47 |
+
- 64
|
48 |
+
- 64
|
49 |
+
- 128
|
50 |
+
- 256
|
51 |
+
attn_depths:
|
52 |
+
- 0
|
53 |
+
- 0
|
54 |
+
- 0
|
55 |
+
- 1
|
56 |
+
|
57 |
+
rew_end_model: null
|
58 |
+
|
59 |
+
actor_critic: null
|
lr/config/env/lr.yaml
ADDED
@@ -0,0 +1,7 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
train:
|
2 |
+
id: lr
|
3 |
+
size: [320, 240]
|
4 |
+
num_actions: 22
|
5 |
+
path_data_low_res: C:\Users\ifrat\Documents\AI-SM64\MarioKart\colab-diamond-csgo\processed\low_res
|
6 |
+
path_data_full_res: C:\Users\ifrat\Documents\AI-SM64\MarioKart\colab-diamond-csgo\processed\full_res
|
7 |
+
keymap: mk64
|
lr/config/trainer.yaml
ADDED
@@ -0,0 +1,105 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
defaults:
|
2 |
+
- _self_
|
3 |
+
- env: lr
|
4 |
+
- agent: lr
|
5 |
+
- world_model_env: default
|
6 |
+
|
7 |
+
hydra:
|
8 |
+
job:
|
9 |
+
chdir: True
|
10 |
+
|
11 |
+
wandb:
|
12 |
+
mode: disabled
|
13 |
+
project: null
|
14 |
+
entity: null
|
15 |
+
name: null
|
16 |
+
group: null
|
17 |
+
tags: null
|
18 |
+
notes: null
|
19 |
+
|
20 |
+
initialization:
|
21 |
+
path_to_ckpt: null
|
22 |
+
load_denoiser: True
|
23 |
+
load_rew_end_model: True
|
24 |
+
load_actor_critic: True
|
25 |
+
|
26 |
+
common:
|
27 |
+
devices: all # int, list of int, cpu, or all
|
28 |
+
seed: null
|
29 |
+
resume: False # do not modify, set by scripts/resume.sh only.
|
30 |
+
|
31 |
+
checkpointing:
|
32 |
+
save_agent_every: 5
|
33 |
+
num_to_keep: 11 # number of checkpoints to keep, use null to disable
|
34 |
+
|
35 |
+
collection:
|
36 |
+
train:
|
37 |
+
num_envs: 1
|
38 |
+
epsilon: 0.01
|
39 |
+
num_steps_total: 100000
|
40 |
+
first_epoch:
|
41 |
+
min: 5000
|
42 |
+
max: 10000 # null: no maximum
|
43 |
+
threshold_rew: 10
|
44 |
+
steps_per_epoch: 100
|
45 |
+
test:
|
46 |
+
num_envs: 1
|
47 |
+
num_episodes: 4
|
48 |
+
epsilon: 0.0
|
49 |
+
num_final_episodes: 100
|
50 |
+
|
51 |
+
static_dataset:
|
52 |
+
path: ${env.path_data_low_res}
|
53 |
+
ignore_sample_weights: True
|
54 |
+
|
55 |
+
training:
|
56 |
+
should: True
|
57 |
+
num_final_epochs: 1500
|
58 |
+
cache_in_ram: False
|
59 |
+
num_workers_data_loaders: 4
|
60 |
+
model_free: False # if True, turn off world_model training and RL in imagination
|
61 |
+
compile_wm: False
|
62 |
+
|
63 |
+
evaluation:
|
64 |
+
should: True
|
65 |
+
every: 20
|
66 |
+
|
67 |
+
denoiser:
|
68 |
+
training:
|
69 |
+
num_autoregressive_steps: 4
|
70 |
+
start_after_epochs: 0
|
71 |
+
steps_first_epoch: 100
|
72 |
+
steps_per_epoch: 100
|
73 |
+
sample_weights: null
|
74 |
+
batch_size: 14
|
75 |
+
grad_acc_steps: 1
|
76 |
+
lr_warmup_steps: 100
|
77 |
+
max_grad_norm: 10.0
|
78 |
+
|
79 |
+
optimizer:
|
80 |
+
lr: 1e-4
|
81 |
+
weight_decay: 1e-2
|
82 |
+
eps: 1e-8
|
83 |
+
|
84 |
+
sigma_distribution: # log normal distribution for sigma during training
|
85 |
+
_target_: models.diffusion.SigmaDistributionConfig
|
86 |
+
loc: -1.2
|
87 |
+
scale: 1.2
|
88 |
+
sigma_min: 2e-3
|
89 |
+
sigma_max: 20
|
90 |
+
|
91 |
+
upsampler:
|
92 |
+
training:
|
93 |
+
num_autoregressive_steps: 1
|
94 |
+
start_after_epochs: 0
|
95 |
+
steps_first_epoch: 400
|
96 |
+
steps_per_epoch: 400
|
97 |
+
sample_weights: null
|
98 |
+
batch_size: 14
|
99 |
+
grad_acc_steps: 1
|
100 |
+
lr_warmup_steps: 100
|
101 |
+
max_grad_norm: 10.0
|
102 |
+
|
103 |
+
optimizer: ${denoiser.optimizer}
|
104 |
+
sigma_distribution: ${denoiser.sigma_distribution}
|
105 |
+
|
lr/config/world_model_env/default.yaml
ADDED
@@ -0,0 +1,27 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
_target_: envs.WorldModelEnvConfig
|
2 |
+
horizon: 1000
|
3 |
+
num_batches_to_preload: 256
|
4 |
+
diffusion_sampler_next_obs:
|
5 |
+
_target_: models.diffusion.DiffusionSamplerConfig
|
6 |
+
num_steps_denoising: 3
|
7 |
+
sigma_min: 2e-3
|
8 |
+
sigma_max: 5.0
|
9 |
+
rho: 7
|
10 |
+
order: 1 # 1: Euler, 2: Heun
|
11 |
+
s_churn: 0.0 # Amount of stochasticity
|
12 |
+
s_tmin: 0.0
|
13 |
+
s_tmax: ${eval:'float("inf")'}
|
14 |
+
s_noise: 1.0
|
15 |
+
s_cond: 0.005
|
16 |
+
diffusion_sampler_upsampling:
|
17 |
+
_target_: models.diffusion.DiffusionSamplerConfig
|
18 |
+
num_steps_denoising: 10
|
19 |
+
sigma_min: 1
|
20 |
+
sigma_max: 5.0
|
21 |
+
rho: 7
|
22 |
+
order: 1 # 1: Euler, 2: Heun
|
23 |
+
s_churn: 10.0 # Amount of stochasticity
|
24 |
+
s_tmin: 1
|
25 |
+
s_tmax: 5
|
26 |
+
s_noise: 0.9
|
27 |
+
s_cond: 0
|
lr/config/world_model_env/fast.yaml
ADDED
@@ -0,0 +1,27 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
_target_: envs.WorldModelEnvConfig
|
2 |
+
horizon: 1000
|
3 |
+
num_batches_to_preload: 256
|
4 |
+
diffusion_sampler_next_obs:
|
5 |
+
_target_: models.diffusion.DiffusionSamplerConfig
|
6 |
+
num_steps_denoising: 1
|
7 |
+
sigma_min: 2e-3
|
8 |
+
sigma_max: 5.0
|
9 |
+
rho: 7
|
10 |
+
order: 1 # 1: Euler, 2: Heun
|
11 |
+
s_churn: 0.0 # Amount of stochasticity
|
12 |
+
s_tmin: 0.0
|
13 |
+
s_tmax: ${eval:'float("inf")'}
|
14 |
+
s_noise: 1.0
|
15 |
+
s_cond: 0.005
|
16 |
+
diffusion_sampler_upsampling:
|
17 |
+
_target_: models.diffusion.DiffusionSamplerConfig
|
18 |
+
num_steps_denoising: 1
|
19 |
+
sigma_min: 1
|
20 |
+
sigma_max: 5.0
|
21 |
+
rho: 7
|
22 |
+
order: 2 # 1: Euler, 2: Heun
|
23 |
+
s_churn: 10.0 # Amount of stochasticity
|
24 |
+
s_tmin: 1
|
25 |
+
s_tmax: 5
|
26 |
+
s_noise: 0.9
|
27 |
+
s_cond: 0
|
lr/model/lr.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:fe47c5cde02a98696c859b13c5465d5ffff40beb49a949fa0f0af6169792df35
|
3 |
+
size 1526764802
|
lr/spawn/0/act.npy
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1e6b54abb6a227046f7114400a6d974a98af861a1af4ac75561f05f510b43a38
|
3 |
+
size 832
|
lr/spawn/0/full_res.npy
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6bcd09b70cdd05575d35f6ab03063656e410b58a1774965f2b9bb87dd0fd5961
|
3 |
+
size 921728
|
lr/spawn/0/full_res_0.png
ADDED
lr/spawn/0/full_res_1.png
ADDED
lr/spawn/0/full_res_2.png
ADDED
lr/spawn/0/full_res_3.png
ADDED
lr/spawn/0/low_res.npy
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:24a5f3b0431e721997eff0e460143c305835aa20f7d3fdd789733b259e3cb1ae
|
3 |
+
size 36992
|
lr/spawn/0/next_act.npy
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6089160fa80a66a24e585cae89e18acb3821b88c925bc439340610f68ea6dab1
|
3 |
+
size 35328
|
lr/spawn/1/act.npy
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:04e943309c82eff98f08ab529807f8219258134192c3acc23e832f2bfdd9050b
|
3 |
+
size 832
|
lr/spawn/1/full_res.npy
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ecfb16a7186c367b8026db7eb0774c150a751d2b598871f386eec6529d7bf912
|
3 |
+
size 921728
|
lr/spawn/1/full_res_0.png
ADDED
lr/spawn/1/full_res_1.png
ADDED
lr/spawn/1/full_res_2.png
ADDED
lr/spawn/1/full_res_3.png
ADDED
lr/spawn/1/low_res.npy
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0b4f67a1457fc5d006272429f2987f0fba78396562173c1520d9c563c00c8a97
|
3 |
+
size 36992
|
lr/spawn/1/next_act.npy
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c878f42c4bca734b0a70a17cf510929c05a42cc2cfbe52f40476e1a42f24a1af
|
3 |
+
size 35328
|
lr/spawn/2/act.npy
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f3c13c96524e58e1b00e9a0bbb3c5b68e8cae77fa1ea9598e79dc1eacd2e5390
|
3 |
+
size 832
|
lr/spawn/2/full_res.npy
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:86b57a277b40e4e8e442b9b9d74a2389030693c4ccb95dd7e387cdc48d955ca7
|
3 |
+
size 921728
|
lr/spawn/2/full_res_0.png
ADDED
lr/spawn/2/full_res_1.png
ADDED
lr/spawn/2/full_res_2.png
ADDED
lr/spawn/2/full_res_3.png
ADDED
lr/spawn/2/low_res.npy
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:970c663025a0531202d614b5187398089b0c44c29fbfc119016af78d8756682e
|
3 |
+
size 36992
|
lr/spawn/2/next_act.npy
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:016f0856b4bbd5d13d186ff9ff605b401e5b7add023650b6db5a60d919ba0897
|
3 |
+
size 35328
|
lr/spawn/3/act.npy
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:efb0df54cd99534aef36df080396848ca7e9ae86ec1ffca0d70374319d149e1b
|
3 |
+
size 832
|
lr/spawn/3/full_res.npy
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9335b4af0460f42cfa39a5cf5490f76f545cecefc038dac6ca49c46c219526da
|
3 |
+
size 921728
|
lr/spawn/3/full_res_0.png
ADDED
lr/spawn/3/full_res_1.png
ADDED
lr/spawn/3/full_res_2.png
ADDED
lr/spawn/3/full_res_3.png
ADDED
lr/spawn/3/low_res.npy
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c755aa63db40943eda78cf4b36fa215f2909c2ec0dfed271cd043f35a1720f20
|
3 |
+
size 36992
|
lr/spawn/3/next_act.npy
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:016f0856b4bbd5d13d186ff9ff605b401e5b7add023650b6db5a60d919ba0897
|
3 |
+
size 35328
|
lr/spawn/4/act.npy
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9a236d4f2de3e30d288571feaf4d200accbf21ecbb80166bebedc133a6872aff
|
3 |
+
size 832
|
lr/spawn/4/full_res.npy
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:eb4e5fe827c42960bc577ffc4ce3d6c562ce0f029c7611e96c016278f67f9b14
|
3 |
+
size 921728
|
lr/spawn/4/full_res_0.png
ADDED
lr/spawn/4/full_res_1.png
ADDED
lr/spawn/4/full_res_2.png
ADDED
lr/spawn/4/full_res_3.png
ADDED
lr/spawn/4/low_res.npy
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f7a3c21f957ca13720ceccdb1f5468684bae8dd956ba39f621ff992d967bca3a
|
3 |
+
size 36992
|
lr/spawn/4/next_act.npy
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:91571ad5a0e807de76ad530ab5e7362b68ea565a5c5e66e471166dbef9580226
|
3 |
+
size 35328
|
lr/spawn/5/act.npy
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:75dde68d3f361792f175ffa223162e6ec49c6a1e569babd1987a997ed47a6803
|
3 |
+
size 832
|
lr/spawn/5/full_res.npy
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b2aeb1dd9b46c1ff832bb96dc064c11ec0f78524df588c9f8005e99cf045c305
|
3 |
+
size 921728
|
lr/spawn/5/full_res_0.png
ADDED
lr/spawn/5/full_res_1.png
ADDED