CheesefireV3lora / training_log.json
foilfoilfoil's picture
Upload 6 files
ea000b9
raw
history blame contribute delete
474 Bytes
{
"base_model_name": "elinas_llama-7b-hf-transformers-4.29",
"base_model_class": "LlamaForCausalLM",
"base_loaded_in_4bit": true,
"base_loaded_in_8bit": false,
"projections": "q, v",
"loss": 1.2101,
"learning_rate": 4.1443278256170227e-10,
"epoch": 1.99,
"current_steps": 15686,
"train_runtime": 47331.0727,
"train_samples_per_second": 0.67,
"train_steps_per_second": 0.005,
"total_flos": 6.648022708267254e+17,
"train_loss": 1.2976071742491992
}