{
  "base_model_name": "meta-llama_Meta-Llama-3-8B",
  "base_model_class": "LlamaForCausalLM",
  "base_loaded_in_4bit": false,
  "base_loaded_in_8bit": false,
  "projections": "q, v",
  "loss": 0.9512,
  "grad_norm": 0.6213752031326294,
  "learning_rate": 0.0005979381443298969,
  "epoch": 4.028685258964144,
  "current_steps": 10055,
  "current_steps_adjusted": 10055,
  "epoch_adjusted": 4.028685258964144,
  "train_runtime": 3864.6216,
  "train_samples_per_second": 25.977,
  "train_steps_per_second": 0.101,
  "total_flos": 4.69608070712918e+17,
  "train_loss": 1.8759732170950008
}