Safetensors
English
llama
chtmp223's picture
Upload folder using huggingface_hub
ba0d393 verified
{
"os": "Linux-6.8.0-48-generic-x86_64-with-glibc2.39",
"python": "3.10.0",
"heartbeatAt": "2025-01-04T20:33:14.710667",
"startedAt": "2025-01-04T20:33:14.192552",
"docker": null,
"cuda": null,
"args": [
"--model_family",
"llama",
"--apply_instruct_masks",
"--token_scaled_loss",
"--seq_parallel_size",
"4",
"--report_to",
"wandb",
"--do_train",
"--model_name_or_path",
"/scratch3/workspace/ctpham_umass_edu-ft/models/Llama-3-8B-ProLong-512k-Base/",
"--config_name",
"/scratch3/workspace/ctpham_umass_edu-ft/models/Llama-3-8B-ProLong-512k-Base/",
"--tokenizer_name",
"/scratch3/workspace/ctpham_umass_edu-ft/models/Llama-3-8B-ProLong-512k-Base/",
"--run_name",
"wp_hparam_prolong-512K-base_bsz-16_lr-1e-5_epochs-1_",
"--output_dir",
"/scratch3/workspace/ctpham_umass_edu-models/wp_hparam_prolong-512K-base_bsz-16_lr-1e-5_epochs-1_",
"--config_overrides_json",
"",
"--gradient_accumulation_steps",
"4",
"--per_device_train_batch_size",
"1",
"--bf16",
"--learning_rate",
"1e-5",
"--min_lr_ratio",
"0.1",
"--lr_scheduler_type",
"cosine",
"--max_grad_norm",
"1.0",
"--adam_beta1",
"0.9",
"--adam_beta2",
"0.95",
"--weight_decay",
"0.1",
"--warmup_ratio",
"0.05",
"--optim",
"adamw_torch",
"--logging_steps",
"1",
"--log_level",
"info",
"--save_steps",
"100",
"--dataloader_num_workers",
"1",
"--disable_tqdm",
"true",
"--use_fast_tokenizer",
"false",
"--remove_unused_columns",
"false",
"--ddp_find_unused_parameters",
"false",
"--fsdp",
"auto_wrap offload",
"--gradient_checkpointing",
"--tokenized_mds_train",
"/work/pi_miyyer_umass_edu/ctpham/BookClaim-dev/data/ft/bookclaim_wp_pack_complete",
"--cuda_empty_cache",
"--num_train_epochs",
"1"
],
"state": "running",
"program": "/work/pi_miyyer_umass_edu/ctpham/BookClaim-dev/prolong-final/finetune.py",
"codePathLocal": "finetune.py",
"codePath": "prolong-final/finetune.py",
"git": {
"remote": "https://github.com/chtmp223/BookGen-dev.git",
"commit": "9c36a7f300815c07d8a1bbceedfa1ef3781014f6"
},
"email": "[email protected]",
"root": "/work/pi_miyyer_umass_edu/ctpham/BookClaim-dev",
"host": "gpu016",
"username": "ctpham_umass_edu",
"executable": "/scratch3/workspace/ctpham_umass_edu-ft/envs/prolong-final/bin/python3.10",
"cpu_count": 112,
"cpu_count_logical": 112,
"cpu_freq": {
"current": 1279.2346785714285,
"min": 800.0,
"max": 3800.0
},
"cpu_freq_per_core": [
{
"current": 765.676,
"min": 800.0,
"max": 3800.0
},
{
"current": 763.953,
"min": 800.0,
"max": 3800.0
},
{
"current": 800.0,
"min": 800.0,
"max": 3800.0
},
{
"current": 800.0,
"min": 800.0,
"max": 3800.0
},
{
"current": 800.0,
"min": 800.0,
"max": 3800.0
},
{
"current": 800.0,
"min": 800.0,
"max": 3800.0
},
{
"current": 800.0,
"min": 800.0,
"max": 3800.0
},
{
"current": 3000.0,
"min": 800.0,
"max": 3800.0
},
{
"current": 3000.0,
"min": 800.0,
"max": 3800.0
},
{
"current": 2999.969,
"min": 800.0,
"max": 3800.0
},
{
"current": 3000.0,
"min": 800.0,
"max": 3800.0
},
{
"current": 786.059,
"min": 800.0,
"max": 3800.0
},
{
"current": 3000.44,
"min": 800.0,
"max": 3800.0
},
{
"current": 800.0,
"min": 800.0,
"max": 3800.0
},
{
"current": 3000.0,
"min": 800.0,
"max": 3800.0
},
{
"current": 800.0,
"min": 800.0,
"max": 3800.0
},
{
"current": 800.0,
"min": 800.0,
"max": 3800.0
},
{
"current": 800.0,
"min": 800.0,
"max": 3800.0
},
{
"current": 800.0,
"min": 800.0,
"max": 3800.0
},
{
"current": 800.0,
"min": 800.0,
"max": 3800.0
},
{
"current": 800.0,
"min": 800.0,
"max": 3800.0
},
{
"current": 800.0,
"min": 800.0,
"max": 3800.0
},
{
"current": 1500.0,
"min": 800.0,
"max": 3800.0
},
{
"current": 800.0,
"min": 800.0,
"max": 3800.0
},
{
"current": 2017.085,
"min": 800.0,
"max": 3800.0
},
{
"current": 800.0,
"min": 800.0,
"max": 3800.0
},
{
"current": 800.0,
"min": 800.0,
"max": 3800.0
},
{
"current": 800.0,
"min": 800.0,
"max": 3800.0
},
{
"current": 800.0,
"min": 800.0,
"max": 3800.0
},
{
"current": 800.0,
"min": 800.0,
"max": 3800.0
},
{
"current": 2400.0,
"min": 800.0,
"max": 3800.0
},
{
"current": 800.0,
"min": 800.0,
"max": 3800.0
},
{
"current": 800.0,
"min": 800.0,
"max": 3800.0
},
{
"current": 800.0,
"min": 800.0,
"max": 3800.0
},
{
"current": 1400.0,
"min": 800.0,
"max": 3800.0
},
{
"current": 800.0,
"min": 800.0,
"max": 3800.0
},
{
"current": 2074.358,
"min": 800.0,
"max": 3800.0
},
{
"current": 800.0,
"min": 800.0,
"max": 3800.0
},
{
"current": 1899.98,
"min": 800.0,
"max": 3800.0
},
{
"current": 800.0,
"min": 800.0,
"max": 3800.0
},
{
"current": 2400.0,
"min": 800.0,
"max": 3800.0
},
{
"current": 800.0,
"min": 800.0,
"max": 3800.0
},
{
"current": 2059.821,
"min": 800.0,
"max": 3800.0
},
{
"current": 800.0,
"min": 800.0,
"max": 3800.0
},
{
"current": 800.0,
"min": 800.0,
"max": 3800.0
},
{
"current": 800.0,
"min": 800.0,
"max": 3800.0
},
{
"current": 784.691,
"min": 800.0,
"max": 3800.0
},
{
"current": 800.0,
"min": 800.0,
"max": 3800.0
},
{
"current": 800.0,
"min": 800.0,
"max": 3800.0
},
{
"current": 800.0,
"min": 800.0,
"max": 3800.0
},
{
"current": 800.0,
"min": 800.0,
"max": 3800.0
},
{
"current": 800.0,
"min": 800.0,
"max": 3800.0
},
{
"current": 793.56,
"min": 800.0,
"max": 3800.0
},
{
"current": 800.0,
"min": 800.0,
"max": 3800.0
},
{
"current": 3800.0,
"min": 800.0,
"max": 3800.0
},
{
"current": 800.0,
"min": 800.0,
"max": 3800.0
},
{
"current": 800.0,
"min": 800.0,
"max": 3800.0
},
{
"current": 800.0,
"min": 800.0,
"max": 3800.0
},
{
"current": 800.0,
"min": 800.0,
"max": 3800.0
},
{
"current": 800.0,
"min": 800.0,
"max": 3800.0
},
{
"current": 793.216,
"min": 800.0,
"max": 3800.0
},
{
"current": 800.0,
"min": 800.0,
"max": 3800.0
},
{
"current": 3800.0,
"min": 800.0,
"max": 3800.0
},
{
"current": 800.0,
"min": 800.0,
"max": 3800.0
},
{
"current": 800.0,
"min": 800.0,
"max": 3800.0
},
{
"current": 756.065,
"min": 800.0,
"max": 3800.0
},
{
"current": 800.0,
"min": 800.0,
"max": 3800.0
},
{
"current": 800.0,
"min": 800.0,
"max": 3800.0
},
{
"current": 800.0,
"min": 800.0,
"max": 3800.0
},
{
"current": 800.0,
"min": 800.0,
"max": 3800.0
},
{
"current": 800.0,
"min": 800.0,
"max": 3800.0
},
{
"current": 3000.0,
"min": 800.0,
"max": 3800.0
},
{
"current": 785.354,
"min": 800.0,
"max": 3800.0
},
{
"current": 3000.0,
"min": 800.0,
"max": 3800.0
},
{
"current": 791.656,
"min": 800.0,
"max": 3800.0
},
{
"current": 3000.0,
"min": 800.0,
"max": 3800.0
},
{
"current": 800.0,
"min": 800.0,
"max": 3800.0
},
{
"current": 2999.969,
"min": 800.0,
"max": 3800.0
},
{
"current": 800.0,
"min": 800.0,
"max": 3800.0
},
{
"current": 3000.0,
"min": 800.0,
"max": 3800.0
},
{
"current": 800.0,
"min": 800.0,
"max": 3800.0
},
{
"current": 3000.0,
"min": 800.0,
"max": 3800.0
},
{
"current": 800.0,
"min": 800.0,
"max": 3800.0
},
{
"current": 3000.0,
"min": 800.0,
"max": 3800.0
},
{
"current": 800.0,
"min": 800.0,
"max": 3800.0
},
{
"current": 3000.0,
"min": 800.0,
"max": 3800.0
},
{
"current": 800.0,
"min": 800.0,
"max": 3800.0
},
{
"current": 3000.0,
"min": 800.0,
"max": 3800.0
},
{
"current": 800.0,
"min": 800.0,
"max": 3800.0
},
{
"current": 3000.0,
"min": 800.0,
"max": 3800.0
},
{
"current": 800.0,
"min": 800.0,
"max": 3800.0
},
{
"current": 3000.0,
"min": 800.0,
"max": 3800.0
},
{
"current": 800.0,
"min": 800.0,
"max": 3800.0
},
{
"current": 800.0,
"min": 800.0,
"max": 3800.0
},
{
"current": 800.0,
"min": 800.0,
"max": 3800.0
},
{
"current": 800.0,
"min": 800.0,
"max": 3800.0
},
{
"current": 800.0,
"min": 800.0,
"max": 3800.0
},
{
"current": 800.0,
"min": 800.0,
"max": 3800.0
},
{
"current": 800.0,
"min": 800.0,
"max": 3800.0
},
{
"current": 800.0,
"min": 800.0,
"max": 3800.0
},
{
"current": 800.0,
"min": 800.0,
"max": 3800.0
},
{
"current": 800.0,
"min": 800.0,
"max": 3800.0
},
{
"current": 800.0,
"min": 800.0,
"max": 3800.0
},
{
"current": 800.0,
"min": 800.0,
"max": 3800.0
},
{
"current": 800.0,
"min": 800.0,
"max": 3800.0
},
{
"current": 765.39,
"min": 800.0,
"max": 3800.0
},
{
"current": 800.0,
"min": 800.0,
"max": 3800.0
},
{
"current": 800.0,
"min": 800.0,
"max": 3800.0
},
{
"current": 800.0,
"min": 800.0,
"max": 3800.0
},
{
"current": 800.0,
"min": 800.0,
"max": 3800.0
},
{
"current": 800.0,
"min": 800.0,
"max": 3800.0
},
{
"current": 800.0,
"min": 800.0,
"max": 3800.0
}
],
"disk": {
"/": {
"total": 438.487850189209,
"used": 16.89361572265625
}
},
"gpu": "NVIDIA A100-SXM4-80GB",
"gpu_count": 4,
"gpu_devices": [
{
"name": "NVIDIA A100-SXM4-80GB",
"memory_total": 85899345920
},
{
"name": "NVIDIA A100-SXM4-80GB",
"memory_total": 85899345920
},
{
"name": "NVIDIA A100-SXM4-80GB",
"memory_total": 85899345920
},
{
"name": "NVIDIA A100-SXM4-80GB",
"memory_total": 85899345920
}
],
"memory": {
"total": 2015.3284606933594
}
}