prosecalign
/

phi3m0128-cds-0.1-kendall-onof-ofif-corr-max-2-simpo-max1500-default

Transformers

Safetensors

Generated from Trainer

llama-factory

Inference Endpoints

Model card Files Files and versions Community

ziansu committed on 24 days ago

Commit

dfdf934

verified ·

1 Parent(s): ff8a202

Training in progress, step 150

Browse files

Files changed (2) hide show

adapter_model.safetensors +1 -1
trainer_log.jsonl +6 -0

adapter_model.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:9bc2ec8127bbbd7aeb881dad40eaf3232d3ff807bff3c547126e17206e6d96ac
 size 25200088

 version https://git-lfs.github.com/spec/v1
+oid sha256:8ae25c255a7b56bc4ebf70ccebdfde6bb570562ec87babfa6d9afbbfaff3c6e1
 size 25200088

trainer_log.jsonl CHANGED Viewed

@@ -10,3 +10,9 @@
 {"current_steps": 90, "total_steps": 1500, "loss": 1.03, "accuracy": 0.22499999403953552, "learning_rate": 4.9557181268217225e-06, "epoch": 0.14125956444967627, "percentage": 6.0, "elapsed_time": "0:11:44", "remaining_time": "3:03:57", "throughput": "0.00", "total_tokens": 0}
 {"current_steps": 100, "total_steps": 1500, "loss": 1.0309, "accuracy": 0.26249998807907104, "learning_rate": 4.9453690018345144e-06, "epoch": 0.15695507161075142, "percentage": 6.67, "elapsed_time": "0:13:01", "remaining_time": "3:02:25", "throughput": "0.00", "total_tokens": 0}
 {"current_steps": 100, "total_steps": 1500, "eval_loss": 1.020836353302002, "epoch": 0.15695507161075142, "percentage": 6.67, "elapsed_time": "0:13:16", "remaining_time": "3:05:48", "throughput": "0.00", "total_tokens": 0}

 {"current_steps": 90, "total_steps": 1500, "loss": 1.03, "accuracy": 0.22499999403953552, "learning_rate": 4.9557181268217225e-06, "epoch": 0.14125956444967627, "percentage": 6.0, "elapsed_time": "0:11:44", "remaining_time": "3:03:57", "throughput": "0.00", "total_tokens": 0}
 {"current_steps": 100, "total_steps": 1500, "loss": 1.0309, "accuracy": 0.26249998807907104, "learning_rate": 4.9453690018345144e-06, "epoch": 0.15695507161075142, "percentage": 6.67, "elapsed_time": "0:13:01", "remaining_time": "3:02:25", "throughput": "0.00", "total_tokens": 0}
 {"current_steps": 100, "total_steps": 1500, "eval_loss": 1.020836353302002, "epoch": 0.15695507161075142, "percentage": 6.67, "elapsed_time": "0:13:16", "remaining_time": "3:05:48", "throughput": "0.00", "total_tokens": 0}
+{"current_steps": 110, "total_steps": 1500, "loss": 1.0388, "accuracy": 0.30000001192092896, "learning_rate": 4.933947257182901e-06, "epoch": 0.17265057877182657, "percentage": 7.33, "elapsed_time": "0:14:38", "remaining_time": "3:04:55", "throughput": "0.00", "total_tokens": 0}
+{"current_steps": 120, "total_steps": 1500, "loss": 1.0247, "accuracy": 0.25, "learning_rate": 4.921457902821578e-06, "epoch": 0.1883460859329017, "percentage": 8.0, "elapsed_time": "0:15:56", "remaining_time": "3:03:19", "throughput": "0.00", "total_tokens": 0}
+{"current_steps": 130, "total_steps": 1500, "loss": 1.0169, "accuracy": 0.30000001192092896, "learning_rate": 4.907906416994146e-06, "epoch": 0.20404159309397685, "percentage": 8.67, "elapsed_time": "0:17:11", "remaining_time": "3:01:13", "throughput": "0.00", "total_tokens": 0}
+{"current_steps": 140, "total_steps": 1500, "loss": 0.9964, "accuracy": 0.3499999940395355, "learning_rate": 4.893298743830168e-06, "epoch": 0.219737100255052, "percentage": 9.33, "elapsed_time": "0:18:27", "remaining_time": "2:59:18", "throughput": "0.00", "total_tokens": 0}
+{"current_steps": 150, "total_steps": 1500, "loss": 1.0073, "accuracy": 0.30000001192092896, "learning_rate": 4.8776412907378845e-06, "epoch": 0.23543260741612712, "percentage": 10.0, "elapsed_time": "0:19:45", "remaining_time": "2:57:45", "throughput": "0.00", "total_tokens": 0}
+{"current_steps": 150, "total_steps": 1500, "eval_loss": 0.9802881479263306, "epoch": 0.23543260741612712, "percentage": 10.0, "elapsed_time": "0:19:59", "remaining_time": "2:59:55", "throughput": "0.00", "total_tokens": 0}