{
"data_root_dir": "/hai/scratch/belkhale/datasets",
"hf_token": ".hf_token",
"image_aug": false,
"is_resume": true,
"pretrained_checkpoint": "runs/prism-qwen25-dinosiglip-224px+0_5b+mx-libero-90+n1+b32+x7--vq_extra_tokenizer/checkpoints/step-065000-epoch-29-loss=0.4407.pt",
"resume_epoch": 29,
"resume_step": 65000,
"run_id": "prism-qwen25-dinosiglip-224px+0_5b+mx-libero-90+n1+b32+x7--vq_extra_tokenizer",
"run_id_note": "vq_extra_tokenizer",
"run_root_dir": "runs",
"save_interval": 2500,
"seed": 7,
"trackers": [
"jsonl",
"wandb"
],
"vla": {
"action_tokenizer": "libero_vq_extra_action_tokenizer",
"base_vlm": "prism-qwen25-extra-dinosiglip-224px+0_5b",
"data_mix": "libero_90",
"enable_gradient_checkpointing": true,
"enable_mixed_precision_training": true,
"epochs": 1000,
"expected_world_size": 8,
"freeze_llm_backbone": false,
"freeze_vision_backbone": false,
"global_batch_size": 256,
"learning_rate": 2e-05,
"lr_scheduler_type": "constant",
"max_grad_norm": 1.0,
"max_steps": null,
"per_device_batch_size": 32,
"reduce_in_full_precision": true,
"save_every_n_steps": 25000,
"shuffle_buffer_size": 256000,
"train_strategy": "fsdp-full-shard",
"type": "prism-qwen25-dinosiglip-224px+0_5b+mx-libero-90",
"unfreeze_last_llm_layer": false,
"vla_id": "prism-qwen25-dinosiglip-224px+0_5b+mx-libero-90",
"warmup_ratio": 0.0,
"weight_decay": 0.0
},
"wandb_entity": null,
"wandb_project": "prismatic"
}