|
{ |
|
"os": "Linux-6.8.0-48-generic-x86_64-with-glibc2.39", |
|
"python": "3.10.0", |
|
"heartbeatAt": "2025-01-04T20:33:14.710667", |
|
"startedAt": "2025-01-04T20:33:14.192552", |
|
"docker": null, |
|
"cuda": null, |
|
"args": [ |
|
"--model_family", |
|
"llama", |
|
"--apply_instruct_masks", |
|
"--token_scaled_loss", |
|
"--seq_parallel_size", |
|
"4", |
|
"--report_to", |
|
"wandb", |
|
"--do_train", |
|
"--model_name_or_path", |
|
"/scratch3/workspace/ctpham_umass_edu-ft/models/Llama-3-8B-ProLong-512k-Base/", |
|
"--config_name", |
|
"/scratch3/workspace/ctpham_umass_edu-ft/models/Llama-3-8B-ProLong-512k-Base/", |
|
"--tokenizer_name", |
|
"/scratch3/workspace/ctpham_umass_edu-ft/models/Llama-3-8B-ProLong-512k-Base/", |
|
"--run_name", |
|
"wp_hparam_prolong-512K-base_bsz-16_lr-1e-5_epochs-1_", |
|
"--output_dir", |
|
"/scratch3/workspace/ctpham_umass_edu-models/wp_hparam_prolong-512K-base_bsz-16_lr-1e-5_epochs-1_", |
|
"--config_overrides_json", |
|
"", |
|
"--gradient_accumulation_steps", |
|
"4", |
|
"--per_device_train_batch_size", |
|
"1", |
|
"--bf16", |
|
"--learning_rate", |
|
"1e-5", |
|
"--min_lr_ratio", |
|
"0.1", |
|
"--lr_scheduler_type", |
|
"cosine", |
|
"--max_grad_norm", |
|
"1.0", |
|
"--adam_beta1", |
|
"0.9", |
|
"--adam_beta2", |
|
"0.95", |
|
"--weight_decay", |
|
"0.1", |
|
"--warmup_ratio", |
|
"0.05", |
|
"--optim", |
|
"adamw_torch", |
|
"--logging_steps", |
|
"1", |
|
"--log_level", |
|
"info", |
|
"--save_steps", |
|
"100", |
|
"--dataloader_num_workers", |
|
"1", |
|
"--disable_tqdm", |
|
"true", |
|
"--use_fast_tokenizer", |
|
"false", |
|
"--remove_unused_columns", |
|
"false", |
|
"--ddp_find_unused_parameters", |
|
"false", |
|
"--fsdp", |
|
"auto_wrap offload", |
|
"--gradient_checkpointing", |
|
"--tokenized_mds_train", |
|
"/work/pi_miyyer_umass_edu/ctpham/BookClaim-dev/data/ft/bookclaim_wp_pack_complete", |
|
"--cuda_empty_cache", |
|
"--num_train_epochs", |
|
"1" |
|
], |
|
"state": "running", |
|
"program": "/work/pi_miyyer_umass_edu/ctpham/BookClaim-dev/prolong-final/finetune.py", |
|
"codePathLocal": "finetune.py", |
|
"codePath": "prolong-final/finetune.py", |
|
"git": { |
|
"remote": "https://github.com/chtmp223/BookGen-dev.git", |
|
"commit": "9c36a7f300815c07d8a1bbceedfa1ef3781014f6" |
|
}, |
|
"email": "[email protected]", |
|
"root": "/work/pi_miyyer_umass_edu/ctpham/BookClaim-dev", |
|
"host": "gpu016", |
|
"username": "ctpham_umass_edu", |
|
"executable": "/scratch3/workspace/ctpham_umass_edu-ft/envs/prolong-final/bin/python3.10", |
|
"cpu_count": 112, |
|
"cpu_count_logical": 112, |
|
"cpu_freq": { |
|
"current": 1279.2346785714285, |
|
"min": 800.0, |
|
"max": 3800.0 |
|
}, |
|
"cpu_freq_per_core": [ |
|
{ |
|
"current": 765.676, |
|
"min": 800.0, |
|
"max": 3800.0 |
|
}, |
|
{ |
|
"current": 763.953, |
|
"min": 800.0, |
|
"max": 3800.0 |
|
}, |
|
{ |
|
"current": 800.0, |
|
"min": 800.0, |
|
"max": 3800.0 |
|
}, |
|
{ |
|
"current": 800.0, |
|
"min": 800.0, |
|
"max": 3800.0 |
|
}, |
|
{ |
|
"current": 800.0, |
|
"min": 800.0, |
|
"max": 3800.0 |
|
}, |
|
{ |
|
"current": 800.0, |
|
"min": 800.0, |
|
"max": 3800.0 |
|
}, |
|
{ |
|
"current": 800.0, |
|
"min": 800.0, |
|
"max": 3800.0 |
|
}, |
|
{ |
|
"current": 3000.0, |
|
"min": 800.0, |
|
"max": 3800.0 |
|
}, |
|
{ |
|
"current": 3000.0, |
|
"min": 800.0, |
|
"max": 3800.0 |
|
}, |
|
{ |
|
"current": 2999.969, |
|
"min": 800.0, |
|
"max": 3800.0 |
|
}, |
|
{ |
|
"current": 3000.0, |
|
"min": 800.0, |
|
"max": 3800.0 |
|
}, |
|
{ |
|
"current": 786.059, |
|
"min": 800.0, |
|
"max": 3800.0 |
|
}, |
|
{ |
|
"current": 3000.44, |
|
"min": 800.0, |
|
"max": 3800.0 |
|
}, |
|
{ |
|
"current": 800.0, |
|
"min": 800.0, |
|
"max": 3800.0 |
|
}, |
|
{ |
|
"current": 3000.0, |
|
"min": 800.0, |
|
"max": 3800.0 |
|
}, |
|
{ |
|
"current": 800.0, |
|
"min": 800.0, |
|
"max": 3800.0 |
|
}, |
|
{ |
|
"current": 800.0, |
|
"min": 800.0, |
|
"max": 3800.0 |
|
}, |
|
{ |
|
"current": 800.0, |
|
"min": 800.0, |
|
"max": 3800.0 |
|
}, |
|
{ |
|
"current": 800.0, |
|
"min": 800.0, |
|
"max": 3800.0 |
|
}, |
|
{ |
|
"current": 800.0, |
|
"min": 800.0, |
|
"max": 3800.0 |
|
}, |
|
{ |
|
"current": 800.0, |
|
"min": 800.0, |
|
"max": 3800.0 |
|
}, |
|
{ |
|
"current": 800.0, |
|
"min": 800.0, |
|
"max": 3800.0 |
|
}, |
|
{ |
|
"current": 1500.0, |
|
"min": 800.0, |
|
"max": 3800.0 |
|
}, |
|
{ |
|
"current": 800.0, |
|
"min": 800.0, |
|
"max": 3800.0 |
|
}, |
|
{ |
|
"current": 2017.085, |
|
"min": 800.0, |
|
"max": 3800.0 |
|
}, |
|
{ |
|
"current": 800.0, |
|
"min": 800.0, |
|
"max": 3800.0 |
|
}, |
|
{ |
|
"current": 800.0, |
|
"min": 800.0, |
|
"max": 3800.0 |
|
}, |
|
{ |
|
"current": 800.0, |
|
"min": 800.0, |
|
"max": 3800.0 |
|
}, |
|
{ |
|
"current": 800.0, |
|
"min": 800.0, |
|
"max": 3800.0 |
|
}, |
|
{ |
|
"current": 800.0, |
|
"min": 800.0, |
|
"max": 3800.0 |
|
}, |
|
{ |
|
"current": 2400.0, |
|
"min": 800.0, |
|
"max": 3800.0 |
|
}, |
|
{ |
|
"current": 800.0, |
|
"min": 800.0, |
|
"max": 3800.0 |
|
}, |
|
{ |
|
"current": 800.0, |
|
"min": 800.0, |
|
"max": 3800.0 |
|
}, |
|
{ |
|
"current": 800.0, |
|
"min": 800.0, |
|
"max": 3800.0 |
|
}, |
|
{ |
|
"current": 1400.0, |
|
"min": 800.0, |
|
"max": 3800.0 |
|
}, |
|
{ |
|
"current": 800.0, |
|
"min": 800.0, |
|
"max": 3800.0 |
|
}, |
|
{ |
|
"current": 2074.358, |
|
"min": 800.0, |
|
"max": 3800.0 |
|
}, |
|
{ |
|
"current": 800.0, |
|
"min": 800.0, |
|
"max": 3800.0 |
|
}, |
|
{ |
|
"current": 1899.98, |
|
"min": 800.0, |
|
"max": 3800.0 |
|
}, |
|
{ |
|
"current": 800.0, |
|
"min": 800.0, |
|
"max": 3800.0 |
|
}, |
|
{ |
|
"current": 2400.0, |
|
"min": 800.0, |
|
"max": 3800.0 |
|
}, |
|
{ |
|
"current": 800.0, |
|
"min": 800.0, |
|
"max": 3800.0 |
|
}, |
|
{ |
|
"current": 2059.821, |
|
"min": 800.0, |
|
"max": 3800.0 |
|
}, |
|
{ |
|
"current": 800.0, |
|
"min": 800.0, |
|
"max": 3800.0 |
|
}, |
|
{ |
|
"current": 800.0, |
|
"min": 800.0, |
|
"max": 3800.0 |
|
}, |
|
{ |
|
"current": 800.0, |
|
"min": 800.0, |
|
"max": 3800.0 |
|
}, |
|
{ |
|
"current": 784.691, |
|
"min": 800.0, |
|
"max": 3800.0 |
|
}, |
|
{ |
|
"current": 800.0, |
|
"min": 800.0, |
|
"max": 3800.0 |
|
}, |
|
{ |
|
"current": 800.0, |
|
"min": 800.0, |
|
"max": 3800.0 |
|
}, |
|
{ |
|
"current": 800.0, |
|
"min": 800.0, |
|
"max": 3800.0 |
|
}, |
|
{ |
|
"current": 800.0, |
|
"min": 800.0, |
|
"max": 3800.0 |
|
}, |
|
{ |
|
"current": 800.0, |
|
"min": 800.0, |
|
"max": 3800.0 |
|
}, |
|
{ |
|
"current": 793.56, |
|
"min": 800.0, |
|
"max": 3800.0 |
|
}, |
|
{ |
|
"current": 800.0, |
|
"min": 800.0, |
|
"max": 3800.0 |
|
}, |
|
{ |
|
"current": 3800.0, |
|
"min": 800.0, |
|
"max": 3800.0 |
|
}, |
|
{ |
|
"current": 800.0, |
|
"min": 800.0, |
|
"max": 3800.0 |
|
}, |
|
{ |
|
"current": 800.0, |
|
"min": 800.0, |
|
"max": 3800.0 |
|
}, |
|
{ |
|
"current": 800.0, |
|
"min": 800.0, |
|
"max": 3800.0 |
|
}, |
|
{ |
|
"current": 800.0, |
|
"min": 800.0, |
|
"max": 3800.0 |
|
}, |
|
{ |
|
"current": 800.0, |
|
"min": 800.0, |
|
"max": 3800.0 |
|
}, |
|
{ |
|
"current": 793.216, |
|
"min": 800.0, |
|
"max": 3800.0 |
|
}, |
|
{ |
|
"current": 800.0, |
|
"min": 800.0, |
|
"max": 3800.0 |
|
}, |
|
{ |
|
"current": 3800.0, |
|
"min": 800.0, |
|
"max": 3800.0 |
|
}, |
|
{ |
|
"current": 800.0, |
|
"min": 800.0, |
|
"max": 3800.0 |
|
}, |
|
{ |
|
"current": 800.0, |
|
"min": 800.0, |
|
"max": 3800.0 |
|
}, |
|
{ |
|
"current": 756.065, |
|
"min": 800.0, |
|
"max": 3800.0 |
|
}, |
|
{ |
|
"current": 800.0, |
|
"min": 800.0, |
|
"max": 3800.0 |
|
}, |
|
{ |
|
"current": 800.0, |
|
"min": 800.0, |
|
"max": 3800.0 |
|
}, |
|
{ |
|
"current": 800.0, |
|
"min": 800.0, |
|
"max": 3800.0 |
|
}, |
|
{ |
|
"current": 800.0, |
|
"min": 800.0, |
|
"max": 3800.0 |
|
}, |
|
{ |
|
"current": 800.0, |
|
"min": 800.0, |
|
"max": 3800.0 |
|
}, |
|
{ |
|
"current": 3000.0, |
|
"min": 800.0, |
|
"max": 3800.0 |
|
}, |
|
{ |
|
"current": 785.354, |
|
"min": 800.0, |
|
"max": 3800.0 |
|
}, |
|
{ |
|
"current": 3000.0, |
|
"min": 800.0, |
|
"max": 3800.0 |
|
}, |
|
{ |
|
"current": 791.656, |
|
"min": 800.0, |
|
"max": 3800.0 |
|
}, |
|
{ |
|
"current": 3000.0, |
|
"min": 800.0, |
|
"max": 3800.0 |
|
}, |
|
{ |
|
"current": 800.0, |
|
"min": 800.0, |
|
"max": 3800.0 |
|
}, |
|
{ |
|
"current": 2999.969, |
|
"min": 800.0, |
|
"max": 3800.0 |
|
}, |
|
{ |
|
"current": 800.0, |
|
"min": 800.0, |
|
"max": 3800.0 |
|
}, |
|
{ |
|
"current": 3000.0, |
|
"min": 800.0, |
|
"max": 3800.0 |
|
}, |
|
{ |
|
"current": 800.0, |
|
"min": 800.0, |
|
"max": 3800.0 |
|
}, |
|
{ |
|
"current": 3000.0, |
|
"min": 800.0, |
|
"max": 3800.0 |
|
}, |
|
{ |
|
"current": 800.0, |
|
"min": 800.0, |
|
"max": 3800.0 |
|
}, |
|
{ |
|
"current": 3000.0, |
|
"min": 800.0, |
|
"max": 3800.0 |
|
}, |
|
{ |
|
"current": 800.0, |
|
"min": 800.0, |
|
"max": 3800.0 |
|
}, |
|
{ |
|
"current": 3000.0, |
|
"min": 800.0, |
|
"max": 3800.0 |
|
}, |
|
{ |
|
"current": 800.0, |
|
"min": 800.0, |
|
"max": 3800.0 |
|
}, |
|
{ |
|
"current": 3000.0, |
|
"min": 800.0, |
|
"max": 3800.0 |
|
}, |
|
{ |
|
"current": 800.0, |
|
"min": 800.0, |
|
"max": 3800.0 |
|
}, |
|
{ |
|
"current": 3000.0, |
|
"min": 800.0, |
|
"max": 3800.0 |
|
}, |
|
{ |
|
"current": 800.0, |
|
"min": 800.0, |
|
"max": 3800.0 |
|
}, |
|
{ |
|
"current": 3000.0, |
|
"min": 800.0, |
|
"max": 3800.0 |
|
}, |
|
{ |
|
"current": 800.0, |
|
"min": 800.0, |
|
"max": 3800.0 |
|
}, |
|
{ |
|
"current": 800.0, |
|
"min": 800.0, |
|
"max": 3800.0 |
|
}, |
|
{ |
|
"current": 800.0, |
|
"min": 800.0, |
|
"max": 3800.0 |
|
}, |
|
{ |
|
"current": 800.0, |
|
"min": 800.0, |
|
"max": 3800.0 |
|
}, |
|
{ |
|
"current": 800.0, |
|
"min": 800.0, |
|
"max": 3800.0 |
|
}, |
|
{ |
|
"current": 800.0, |
|
"min": 800.0, |
|
"max": 3800.0 |
|
}, |
|
{ |
|
"current": 800.0, |
|
"min": 800.0, |
|
"max": 3800.0 |
|
}, |
|
{ |
|
"current": 800.0, |
|
"min": 800.0, |
|
"max": 3800.0 |
|
}, |
|
{ |
|
"current": 800.0, |
|
"min": 800.0, |
|
"max": 3800.0 |
|
}, |
|
{ |
|
"current": 800.0, |
|
"min": 800.0, |
|
"max": 3800.0 |
|
}, |
|
{ |
|
"current": 800.0, |
|
"min": 800.0, |
|
"max": 3800.0 |
|
}, |
|
{ |
|
"current": 800.0, |
|
"min": 800.0, |
|
"max": 3800.0 |
|
}, |
|
{ |
|
"current": 800.0, |
|
"min": 800.0, |
|
"max": 3800.0 |
|
}, |
|
{ |
|
"current": 765.39, |
|
"min": 800.0, |
|
"max": 3800.0 |
|
}, |
|
{ |
|
"current": 800.0, |
|
"min": 800.0, |
|
"max": 3800.0 |
|
}, |
|
{ |
|
"current": 800.0, |
|
"min": 800.0, |
|
"max": 3800.0 |
|
}, |
|
{ |
|
"current": 800.0, |
|
"min": 800.0, |
|
"max": 3800.0 |
|
}, |
|
{ |
|
"current": 800.0, |
|
"min": 800.0, |
|
"max": 3800.0 |
|
}, |
|
{ |
|
"current": 800.0, |
|
"min": 800.0, |
|
"max": 3800.0 |
|
}, |
|
{ |
|
"current": 800.0, |
|
"min": 800.0, |
|
"max": 3800.0 |
|
} |
|
], |
|
"disk": { |
|
"/": { |
|
"total": 438.487850189209, |
|
"used": 16.89361572265625 |
|
} |
|
}, |
|
"gpu": "NVIDIA A100-SXM4-80GB", |
|
"gpu_count": 4, |
|
"gpu_devices": [ |
|
{ |
|
"name": "NVIDIA A100-SXM4-80GB", |
|
"memory_total": 85899345920 |
|
}, |
|
{ |
|
"name": "NVIDIA A100-SXM4-80GB", |
|
"memory_total": 85899345920 |
|
}, |
|
{ |
|
"name": "NVIDIA A100-SXM4-80GB", |
|
"memory_total": 85899345920 |
|
}, |
|
{ |
|
"name": "NVIDIA A100-SXM4-80GB", |
|
"memory_total": 85899345920 |
|
} |
|
], |
|
"memory": { |
|
"total": 2015.3284606933594 |
|
} |
|
} |
|
|