DereWah committed on
Commit
b8d8584
1 Parent(s): aef211b

Upload 54 files

Browse files
This view is limited to 50 files because it contains too many changes. See raw diff
Files changed (50) hide show
  1. lr/config/agent/lr.yaml +59 -0
  2. lr/config/env/lr.yaml +7 -0
  3. lr/config/trainer.yaml +105 -0
  4. lr/config/world_model_env/default.yaml +27 -0
  5. lr/config/world_model_env/fast.yaml +27 -0
  6. lr/model/lr.pt +3 -0
  7. lr/spawn/0/act.npy +3 -0
  8. lr/spawn/0/full_res.npy +3 -0
  9. lr/spawn/0/full_res_0.png +0 -0
  10. lr/spawn/0/full_res_1.png +0 -0
  11. lr/spawn/0/full_res_2.png +0 -0
  12. lr/spawn/0/full_res_3.png +0 -0
  13. lr/spawn/0/low_res.npy +3 -0
  14. lr/spawn/0/next_act.npy +3 -0
  15. lr/spawn/1/act.npy +3 -0
  16. lr/spawn/1/full_res.npy +3 -0
  17. lr/spawn/1/full_res_0.png +0 -0
  18. lr/spawn/1/full_res_1.png +0 -0
  19. lr/spawn/1/full_res_2.png +0 -0
  20. lr/spawn/1/full_res_3.png +0 -0
  21. lr/spawn/1/low_res.npy +3 -0
  22. lr/spawn/1/next_act.npy +3 -0
  23. lr/spawn/2/act.npy +3 -0
  24. lr/spawn/2/full_res.npy +3 -0
  25. lr/spawn/2/full_res_0.png +0 -0
  26. lr/spawn/2/full_res_1.png +0 -0
  27. lr/spawn/2/full_res_2.png +0 -0
  28. lr/spawn/2/full_res_3.png +0 -0
  29. lr/spawn/2/low_res.npy +3 -0
  30. lr/spawn/2/next_act.npy +3 -0
  31. lr/spawn/3/act.npy +3 -0
  32. lr/spawn/3/full_res.npy +3 -0
  33. lr/spawn/3/full_res_0.png +0 -0
  34. lr/spawn/3/full_res_1.png +0 -0
  35. lr/spawn/3/full_res_2.png +0 -0
  36. lr/spawn/3/full_res_3.png +0 -0
  37. lr/spawn/3/low_res.npy +3 -0
  38. lr/spawn/3/next_act.npy +3 -0
  39. lr/spawn/4/act.npy +3 -0
  40. lr/spawn/4/full_res.npy +3 -0
  41. lr/spawn/4/full_res_0.png +0 -0
  42. lr/spawn/4/full_res_1.png +0 -0
  43. lr/spawn/4/full_res_2.png +0 -0
  44. lr/spawn/4/full_res_3.png +0 -0
  45. lr/spawn/4/low_res.npy +3 -0
  46. lr/spawn/4/next_act.npy +3 -0
  47. lr/spawn/5/act.npy +3 -0
  48. lr/spawn/5/full_res.npy +3 -0
  49. lr/spawn/5/full_res_0.png +0 -0
  50. lr/spawn/5/full_res_1.png +0 -0
lr/config/agent/lr.yaml ADDED
@@ -0,0 +1,59 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ _target_: agent.AgentConfig
2
+
3
+ denoiser:
4
+ _target_: models.diffusion.DenoiserConfig
5
+ sigma_data: 0.5
6
+ sigma_offset_noise: 0.1
7
+ noise_previous_obs: true
8
+ upsampling_factor: null
9
+ inner_model:
10
+ _target_: models.diffusion.InnerModelConfig
11
+ img_channels: 3
12
+ num_steps_conditioning: 4
13
+ cond_channels: 2048
14
+ depths:
15
+ - 2
16
+ - 2
17
+ - 2
18
+ - 2
19
+ channels:
20
+ - 128
21
+ - 256
22
+ - 512
23
+ - 1024
24
+ attn_depths:
25
+ - 0
26
+ - 0
27
+ - 1
28
+ - 1
29
+
30
+ upsampler:
31
+ _target_: models.diffusion.DenoiserConfig
32
+ sigma_data: 0.5
33
+ sigma_offset_noise: 0.1
34
+ noise_previous_obs: false
35
+ upsampling_factor: 5
36
+ inner_model:
37
+ _target_: models.diffusion.InnerModelConfig
38
+ img_channels: 3
39
+ num_steps_conditioning: 1
40
+ cond_channels: 2048
41
+ depths:
42
+ - 2
43
+ - 2
44
+ - 2
45
+ - 2
46
+ channels:
47
+ - 64
48
+ - 64
49
+ - 128
50
+ - 256
51
+ attn_depths:
52
+ - 0
53
+ - 0
54
+ - 0
55
+ - 1
56
+
57
+ rew_end_model: null
58
+
59
+ actor_critic: null
lr/config/env/lr.yaml ADDED
@@ -0,0 +1,7 @@
 
 
 
 
 
 
 
 
1
+ train:
2
+ id: lr
3
+ size: [320, 240]
4
+ num_actions: 22
5
+ path_data_low_res: C:\Users\ifrat\Documents\AI-SM64\MarioKart\colab-diamond-csgo\processed\low_res
6
+ path_data_full_res: C:\Users\ifrat\Documents\AI-SM64\MarioKart\colab-diamond-csgo\processed\full_res
7
+ keymap: mk64
lr/config/trainer.yaml ADDED
@@ -0,0 +1,105 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ defaults:
2
+ - _self_
3
+ - env: lr
4
+ - agent: lr
5
+ - world_model_env: default
6
+
7
+ hydra:
8
+ job:
9
+ chdir: True
10
+
11
+ wandb:
12
+ mode: disabled
13
+ project: null
14
+ entity: null
15
+ name: null
16
+ group: null
17
+ tags: null
18
+ notes: null
19
+
20
+ initialization:
21
+ path_to_ckpt: null
22
+ load_denoiser: True
23
+ load_rew_end_model: True
24
+ load_actor_critic: True
25
+
26
+ common:
27
+ devices: all # int, list of int, cpu, or all
28
+ seed: null
29
+ resume: False # do not modify, set by scripts/resume.sh only.
30
+
31
+ checkpointing:
32
+ save_agent_every: 5
33
+ num_to_keep: 11 # number of checkpoints to keep, use null to disable
34
+
35
+ collection:
36
+ train:
37
+ num_envs: 1
38
+ epsilon: 0.01
39
+ num_steps_total: 100000
40
+ first_epoch:
41
+ min: 5000
42
+ max: 10000 # null: no maximum
43
+ threshold_rew: 10
44
+ steps_per_epoch: 100
45
+ test:
46
+ num_envs: 1
47
+ num_episodes: 4
48
+ epsilon: 0.0
49
+ num_final_episodes: 100
50
+
51
+ static_dataset:
52
+ path: ${env.path_data_low_res}
53
+ ignore_sample_weights: True
54
+
55
+ training:
56
+ should: True
57
+ num_final_epochs: 1500
58
+ cache_in_ram: False
59
+ num_workers_data_loaders: 4
60
+ model_free: False # if True, turn off world_model training and RL in imagination
61
+ compile_wm: False
62
+
63
+ evaluation:
64
+ should: True
65
+ every: 20
66
+
67
+ denoiser:
68
+ training:
69
+ num_autoregressive_steps: 4
70
+ start_after_epochs: 0
71
+ steps_first_epoch: 100
72
+ steps_per_epoch: 100
73
+ sample_weights: null
74
+ batch_size: 14
75
+ grad_acc_steps: 1
76
+ lr_warmup_steps: 100
77
+ max_grad_norm: 10.0
78
+
79
+ optimizer:
80
+ lr: 1e-4
81
+ weight_decay: 1e-2
82
+ eps: 1e-8
83
+
84
+ sigma_distribution: # log normal distribution for sigma during training
85
+ _target_: models.diffusion.SigmaDistributionConfig
86
+ loc: -1.2
87
+ scale: 1.2
88
+ sigma_min: 2e-3
89
+ sigma_max: 20
90
+
91
+ upsampler:
92
+ training:
93
+ num_autoregressive_steps: 1
94
+ start_after_epochs: 0
95
+ steps_first_epoch: 400
96
+ steps_per_epoch: 400
97
+ sample_weights: null
98
+ batch_size: 14
99
+ grad_acc_steps: 1
100
+ lr_warmup_steps: 100
101
+ max_grad_norm: 10.0
102
+
103
+ optimizer: ${denoiser.optimizer}
104
+ sigma_distribution: ${denoiser.sigma_distribution}
105
+
lr/config/world_model_env/default.yaml ADDED
@@ -0,0 +1,27 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ _target_: envs.WorldModelEnvConfig
2
+ horizon: 1000
3
+ num_batches_to_preload: 256
4
+ diffusion_sampler_next_obs:
5
+ _target_: models.diffusion.DiffusionSamplerConfig
6
+ num_steps_denoising: 3
7
+ sigma_min: 2e-3
8
+ sigma_max: 5.0
9
+ rho: 7
10
+ order: 1 # 1: Euler, 2: Heun
11
+ s_churn: 0.0 # Amount of stochasticity
12
+ s_tmin: 0.0
13
+ s_tmax: ${eval:'float("inf")'}
14
+ s_noise: 1.0
15
+ s_cond: 0.005
16
+ diffusion_sampler_upsampling:
17
+ _target_: models.diffusion.DiffusionSamplerConfig
18
+ num_steps_denoising: 10
19
+ sigma_min: 1
20
+ sigma_max: 5.0
21
+ rho: 7
22
+ order: 1 # 1: Euler, 2: Heun
23
+ s_churn: 10.0 # Amount of stochasticity
24
+ s_tmin: 1
25
+ s_tmax: 5
26
+ s_noise: 0.9
27
+ s_cond: 0
lr/config/world_model_env/fast.yaml ADDED
@@ -0,0 +1,27 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ _target_: envs.WorldModelEnvConfig
2
+ horizon: 1000
3
+ num_batches_to_preload: 256
4
+ diffusion_sampler_next_obs:
5
+ _target_: models.diffusion.DiffusionSamplerConfig
6
+ num_steps_denoising: 1
7
+ sigma_min: 2e-3
8
+ sigma_max: 5.0
9
+ rho: 7
10
+ order: 1 # 1: Euler, 2: Heun
11
+ s_churn: 0.0 # Amount of stochasticity
12
+ s_tmin: 0.0
13
+ s_tmax: ${eval:'float("inf")'}
14
+ s_noise: 1.0
15
+ s_cond: 0.005
16
+ diffusion_sampler_upsampling:
17
+ _target_: models.diffusion.DiffusionSamplerConfig
18
+ num_steps_denoising: 1
19
+ sigma_min: 1
20
+ sigma_max: 5.0
21
+ rho: 7
22
+ order: 2 # 1: Euler, 2: Heun
23
+ s_churn: 10.0 # Amount of stochasticity
24
+ s_tmin: 1
25
+ s_tmax: 5
26
+ s_noise: 0.9
27
+ s_cond: 0
lr/model/lr.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fe47c5cde02a98696c859b13c5465d5ffff40beb49a949fa0f0af6169792df35
3
+ size 1526764802
lr/spawn/0/act.npy ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1e6b54abb6a227046f7114400a6d974a98af861a1af4ac75561f05f510b43a38
3
+ size 832
lr/spawn/0/full_res.npy ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6bcd09b70cdd05575d35f6ab03063656e410b58a1774965f2b9bb87dd0fd5961
3
+ size 921728
lr/spawn/0/full_res_0.png ADDED
lr/spawn/0/full_res_1.png ADDED
lr/spawn/0/full_res_2.png ADDED
lr/spawn/0/full_res_3.png ADDED
lr/spawn/0/low_res.npy ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:24a5f3b0431e721997eff0e460143c305835aa20f7d3fdd789733b259e3cb1ae
3
+ size 36992
lr/spawn/0/next_act.npy ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6089160fa80a66a24e585cae89e18acb3821b88c925bc439340610f68ea6dab1
3
+ size 35328
lr/spawn/1/act.npy ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:04e943309c82eff98f08ab529807f8219258134192c3acc23e832f2bfdd9050b
3
+ size 832
lr/spawn/1/full_res.npy ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ecfb16a7186c367b8026db7eb0774c150a751d2b598871f386eec6529d7bf912
3
+ size 921728
lr/spawn/1/full_res_0.png ADDED
lr/spawn/1/full_res_1.png ADDED
lr/spawn/1/full_res_2.png ADDED
lr/spawn/1/full_res_3.png ADDED
lr/spawn/1/low_res.npy ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0b4f67a1457fc5d006272429f2987f0fba78396562173c1520d9c563c00c8a97
3
+ size 36992
lr/spawn/1/next_act.npy ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c878f42c4bca734b0a70a17cf510929c05a42cc2cfbe52f40476e1a42f24a1af
3
+ size 35328
lr/spawn/2/act.npy ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f3c13c96524e58e1b00e9a0bbb3c5b68e8cae77fa1ea9598e79dc1eacd2e5390
3
+ size 832
lr/spawn/2/full_res.npy ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:86b57a277b40e4e8e442b9b9d74a2389030693c4ccb95dd7e387cdc48d955ca7
3
+ size 921728
lr/spawn/2/full_res_0.png ADDED
lr/spawn/2/full_res_1.png ADDED
lr/spawn/2/full_res_2.png ADDED
lr/spawn/2/full_res_3.png ADDED
lr/spawn/2/low_res.npy ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:970c663025a0531202d614b5187398089b0c44c29fbfc119016af78d8756682e
3
+ size 36992
lr/spawn/2/next_act.npy ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:016f0856b4bbd5d13d186ff9ff605b401e5b7add023650b6db5a60d919ba0897
3
+ size 35328
lr/spawn/3/act.npy ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:efb0df54cd99534aef36df080396848ca7e9ae86ec1ffca0d70374319d149e1b
3
+ size 832
lr/spawn/3/full_res.npy ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9335b4af0460f42cfa39a5cf5490f76f545cecefc038dac6ca49c46c219526da
3
+ size 921728
lr/spawn/3/full_res_0.png ADDED
lr/spawn/3/full_res_1.png ADDED
lr/spawn/3/full_res_2.png ADDED
lr/spawn/3/full_res_3.png ADDED
lr/spawn/3/low_res.npy ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c755aa63db40943eda78cf4b36fa215f2909c2ec0dfed271cd043f35a1720f20
3
+ size 36992
lr/spawn/3/next_act.npy ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:016f0856b4bbd5d13d186ff9ff605b401e5b7add023650b6db5a60d919ba0897
3
+ size 35328
lr/spawn/4/act.npy ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9a236d4f2de3e30d288571feaf4d200accbf21ecbb80166bebedc133a6872aff
3
+ size 832
lr/spawn/4/full_res.npy ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:eb4e5fe827c42960bc577ffc4ce3d6c562ce0f029c7611e96c016278f67f9b14
3
+ size 921728
lr/spawn/4/full_res_0.png ADDED
lr/spawn/4/full_res_1.png ADDED
lr/spawn/4/full_res_2.png ADDED
lr/spawn/4/full_res_3.png ADDED
lr/spawn/4/low_res.npy ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f7a3c21f957ca13720ceccdb1f5468684bae8dd956ba39f621ff992d967bca3a
3
+ size 36992
lr/spawn/4/next_act.npy ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:91571ad5a0e807de76ad530ab5e7362b68ea565a5c5e66e471166dbef9580226
3
+ size 35328
lr/spawn/5/act.npy ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:75dde68d3f361792f175ffa223162e6ec49c6a1e569babd1987a997ed47a6803
3
+ size 832
lr/spawn/5/full_res.npy ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b2aeb1dd9b46c1ff832bb96dc064c11ec0f78524df588c9f8005e99cf045c305
3
+ size 921728
lr/spawn/5/full_res_0.png ADDED
lr/spawn/5/full_res_1.png ADDED