pepijn223 HF staff committed on
Commit
1691d18
·
verified ·
1 Parent(s): b7932b0

Upload folder using huggingface_hub

Browse files
Files changed (4) hide show
  1. README.md +1 -1
  2. config.json +24 -21
  3. config.yaml +27 -37
  4. model.safetensors +2 -2
README.md CHANGED
@@ -1,10 +1,10 @@
1
  ---
2
  library_name: lerobot
3
  tags:
 
4
  - model_hub_mixin
5
  - pytorch_model_hub_mixin
6
  - robotics
7
- - vqbet
8
  ---
9
 
10
  This model has been pushed to the Hub using the [PytorchModelHubMixin](https://huggingface.co/docs/huggingface_hub/package_reference/mixins#huggingface_hub.PyTorchModelHubMixin) integration:
 
1
  ---
2
  library_name: lerobot
3
  tags:
4
+ - diffusion-policy
5
  - model_hub_mixin
6
  - pytorch_model_hub_mixin
7
  - robotics
 
8
  ---
9
 
10
  This model has been pushed to the Hub using the [PytorchModelHubMixin](https://huggingface.co/docs/huggingface_hub/package_reference/mixins#huggingface_hub.PyTorchModelHubMixin) integration:
config.json CHANGED
@@ -1,18 +1,22 @@
1
  {
2
- "action_chunk_size": 5,
3
- "bet_softmax_temperature": 0.1,
 
 
 
4
  "crop_is_random": true,
5
  "crop_shape": [
6
  84,
7
  84
8
  ],
9
- "dropout": 0.1,
10
- "gpt_block_size": 500,
11
- "gpt_hidden_dim": 512,
12
- "gpt_input_dim": 512,
13
- "gpt_n_head": 8,
14
- "gpt_n_layer": 8,
15
- "gpt_output_dim": 512,
 
16
  "input_normalization_modes": {
17
  "observation.image": "mean_std",
18
  "observation.state": "min_max"
@@ -27,11 +31,13 @@
27
  2
28
  ]
29
  },
30
- "mlp_hidden_dim": 1024,
31
- "n_action_pred_token": 7,
32
- "n_obs_steps": 5,
33
- "n_vqvae_training_steps": 20000,
34
- "offset_loss_weight": 10000.0,
 
 
35
  "output_normalization_modes": {
36
  "action": "min_max"
37
  },
@@ -40,14 +46,11 @@
40
  2
41
  ]
42
  },
 
43
  "pretrained_backbone_weights": null,
44
- "primary_code_loss_weight": 5.0,
45
- "secondary_code_loss_weight": 0.5,
46
- "sequentially_select": false,
47
  "spatial_softmax_num_keypoints": 32,
 
48
  "use_group_norm": true,
49
- "vision_backbone": "resnet18",
50
- "vqvae_embedding_dim": 256,
51
- "vqvae_enc_hidden_dim": 128,
52
- "vqvae_n_embed": 16
53
  }
 
1
  {
2
+ "beta_end": 0.02,
3
+ "beta_schedule": "squaredcos_cap_v2",
4
+ "beta_start": 0.0001,
5
+ "clip_sample": true,
6
+ "clip_sample_range": 1.0,
7
  "crop_is_random": true,
8
  "crop_shape": [
9
  84,
10
  84
11
  ],
12
+ "diffusion_step_embed_dim": 128,
13
+ "do_mask_loss_for_padding": false,
14
+ "down_dims": [
15
+ 512,
16
+ 1024,
17
+ 2048
18
+ ],
19
+ "horizon": 16,
20
  "input_normalization_modes": {
21
  "observation.image": "mean_std",
22
  "observation.state": "min_max"
 
31
  2
32
  ]
33
  },
34
+ "kernel_size": 5,
35
+ "n_action_steps": 8,
36
+ "n_groups": 8,
37
+ "n_obs_steps": 2,
38
+ "noise_scheduler_type": "DDPM",
39
+ "num_inference_steps": null,
40
+ "num_train_timesteps": 100,
41
  "output_normalization_modes": {
42
  "action": "min_max"
43
  },
 
46
  2
47
  ]
48
  },
49
+ "prediction_type": "epsilon",
50
  "pretrained_backbone_weights": null,
 
 
 
51
  "spatial_softmax_num_keypoints": 32,
52
+ "use_film_scale_modulation": true,
53
  "use_group_norm": true,
54
+ "use_separate_rgb_encoder_per_camera": false,
55
+ "vision_backbone": "resnet18"
 
 
56
  }
config.yaml CHANGED
@@ -59,30 +59,14 @@ training:
59
  - 0.999
60
  adam_eps: 1.0e-08
61
  adam_weight_decay: 1.0e-06
62
- vqvae_lr: 0.001
63
- n_vqvae_training_steps: 20000
64
- bet_weight_decay: 0.0002
65
- bet_learning_rate: 5.5e-05
66
- bet_betas:
67
- - 0.9
68
- - 0.999
69
  delta_timestamps:
70
  observation.image:
71
- - -0.4
72
- - -0.3
73
- - -0.2
74
  - -0.1
75
  - 0.0
76
  observation.state:
77
- - -0.4
78
- - -0.3
79
- - -0.2
80
  - -0.1
81
  - 0.0
82
  action:
83
- - -0.4
84
- - -0.3
85
- - -0.2
86
  - -0.1
87
  - 0.0
88
  - 0.1
@@ -95,6 +79,11 @@ training:
95
  - 0.8
96
  - 0.9
97
  - 1.0
 
 
 
 
 
98
  eval:
99
  n_episodes: 50
100
  batch_size: 50
@@ -143,10 +132,10 @@ override_dataset_stats:
143
  - 511.0
144
  - 511.0
145
  policy:
146
- name: vqbet
147
- n_obs_steps: 5
148
- n_action_pred_token: 7
149
- action_chunk_size: 5
150
  input_shapes:
151
  observation.image:
152
  - 3
@@ -170,20 +159,21 @@ policy:
170
  pretrained_backbone_weights: null
171
  use_group_norm: true
172
  spatial_softmax_num_keypoints: 32
173
- n_vqvae_training_steps: ${training.n_vqvae_training_steps}
174
- vqvae_n_embed: 16
175
- vqvae_embedding_dim: 256
176
- vqvae_enc_hidden_dim: 128
177
- gpt_block_size: 500
178
- gpt_input_dim: 512
179
- gpt_output_dim: 512
180
- gpt_n_layer: 8
181
- gpt_n_head: 8
182
- gpt_hidden_dim: 512
183
- dropout: 0.1
184
- mlp_hidden_dim: 1024
185
- offset_loss_weight: 10000.0
186
- primary_code_loss_weight: 5.0
187
- secondary_code_loss_weight: 0.5
188
- bet_softmax_temperature: 0.1
189
- sequentially_select: false
 
 
59
  - 0.999
60
  adam_eps: 1.0e-08
61
  adam_weight_decay: 1.0e-06
 
 
 
 
 
 
 
62
  delta_timestamps:
63
  observation.image:
 
 
 
64
  - -0.1
65
  - 0.0
66
  observation.state:
 
 
 
67
  - -0.1
68
  - 0.0
69
  action:
 
 
 
70
  - -0.1
71
  - 0.0
72
  - 0.1
 
79
  - 0.8
80
  - 0.9
81
  - 1.0
82
+ - 1.1
83
+ - 1.2
84
+ - 1.3
85
+ - 1.4
86
+ drop_n_last_frames: 7
87
  eval:
88
  n_episodes: 50
89
  batch_size: 50
 
132
  - 511.0
133
  - 511.0
134
  policy:
135
+ name: diffusion
136
+ n_obs_steps: 2
137
+ horizon: 16
138
+ n_action_steps: 8
139
  input_shapes:
140
  observation.image:
141
  - 3
 
159
  pretrained_backbone_weights: null
160
  use_group_norm: true
161
  spatial_softmax_num_keypoints: 32
162
+ down_dims:
163
+ - 512
164
+ - 1024
165
+ - 2048
166
+ kernel_size: 5
167
+ n_groups: 8
168
+ diffusion_step_embed_dim: 128
169
+ use_film_scale_modulation: true
170
+ noise_scheduler_type: DDPM
171
+ num_train_timesteps: 100
172
+ beta_schedule: squaredcos_cap_v2
173
+ beta_start: 0.0001
174
+ beta_end: 0.02
175
+ prediction_type: epsilon
176
+ clip_sample: true
177
+ clip_sample_range: 1.0
178
+ num_inference_steps: null
179
+ do_mask_loss_for_padding: false
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:670f97a37fb578a8da6eefa9ac8d019352899c0c6407e3a023433ce156c12a03
3
- size 158152442
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ebd4f2ba3500b315a4f45f6d7ff6c6acfd3891c768fbae945cdc17e7ceff5e76
3
+ size 1050862408