Training in progress, step 150
Browse files- adapter_model.safetensors +1 -1
- trainer_log.jsonl +6 -0
adapter_model.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 25200088
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8ae25c255a7b56bc4ebf70ccebdfde6bb570562ec87babfa6d9afbbfaff3c6e1
|
3 |
size 25200088
|
trainer_log.jsonl
CHANGED
@@ -10,3 +10,9 @@
|
|
10 |
{"current_steps": 90, "total_steps": 1500, "loss": 1.03, "accuracy": 0.22499999403953552, "learning_rate": 4.9557181268217225e-06, "epoch": 0.14125956444967627, "percentage": 6.0, "elapsed_time": "0:11:44", "remaining_time": "3:03:57", "throughput": "0.00", "total_tokens": 0}
|
11 |
{"current_steps": 100, "total_steps": 1500, "loss": 1.0309, "accuracy": 0.26249998807907104, "learning_rate": 4.9453690018345144e-06, "epoch": 0.15695507161075142, "percentage": 6.67, "elapsed_time": "0:13:01", "remaining_time": "3:02:25", "throughput": "0.00", "total_tokens": 0}
|
12 |
{"current_steps": 100, "total_steps": 1500, "eval_loss": 1.020836353302002, "epoch": 0.15695507161075142, "percentage": 6.67, "elapsed_time": "0:13:16", "remaining_time": "3:05:48", "throughput": "0.00", "total_tokens": 0}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
10 |
{"current_steps": 90, "total_steps": 1500, "loss": 1.03, "accuracy": 0.22499999403953552, "learning_rate": 4.9557181268217225e-06, "epoch": 0.14125956444967627, "percentage": 6.0, "elapsed_time": "0:11:44", "remaining_time": "3:03:57", "throughput": "0.00", "total_tokens": 0}
|
11 |
{"current_steps": 100, "total_steps": 1500, "loss": 1.0309, "accuracy": 0.26249998807907104, "learning_rate": 4.9453690018345144e-06, "epoch": 0.15695507161075142, "percentage": 6.67, "elapsed_time": "0:13:01", "remaining_time": "3:02:25", "throughput": "0.00", "total_tokens": 0}
|
12 |
{"current_steps": 100, "total_steps": 1500, "eval_loss": 1.020836353302002, "epoch": 0.15695507161075142, "percentage": 6.67, "elapsed_time": "0:13:16", "remaining_time": "3:05:48", "throughput": "0.00", "total_tokens": 0}
|
13 |
+
{"current_steps": 110, "total_steps": 1500, "loss": 1.0388, "accuracy": 0.30000001192092896, "learning_rate": 4.933947257182901e-06, "epoch": 0.17265057877182657, "percentage": 7.33, "elapsed_time": "0:14:38", "remaining_time": "3:04:55", "throughput": "0.00", "total_tokens": 0}
|
14 |
+
{"current_steps": 120, "total_steps": 1500, "loss": 1.0247, "accuracy": 0.25, "learning_rate": 4.921457902821578e-06, "epoch": 0.1883460859329017, "percentage": 8.0, "elapsed_time": "0:15:56", "remaining_time": "3:03:19", "throughput": "0.00", "total_tokens": 0}
|
15 |
+
{"current_steps": 130, "total_steps": 1500, "loss": 1.0169, "accuracy": 0.30000001192092896, "learning_rate": 4.907906416994146e-06, "epoch": 0.20404159309397685, "percentage": 8.67, "elapsed_time": "0:17:11", "remaining_time": "3:01:13", "throughput": "0.00", "total_tokens": 0}
|
16 |
+
{"current_steps": 140, "total_steps": 1500, "loss": 0.9964, "accuracy": 0.3499999940395355, "learning_rate": 4.893298743830168e-06, "epoch": 0.219737100255052, "percentage": 9.33, "elapsed_time": "0:18:27", "remaining_time": "2:59:18", "throughput": "0.00", "total_tokens": 0}
|
17 |
+
{"current_steps": 150, "total_steps": 1500, "loss": 1.0073, "accuracy": 0.30000001192092896, "learning_rate": 4.8776412907378845e-06, "epoch": 0.23543260741612712, "percentage": 10.0, "elapsed_time": "0:19:45", "remaining_time": "2:57:45", "throughput": "0.00", "total_tokens": 0}
|
18 |
+
{"current_steps": 150, "total_steps": 1500, "eval_loss": 0.9802881479263306, "epoch": 0.23543260741612712, "percentage": 10.0, "elapsed_time": "0:19:59", "remaining_time": "2:59:55", "throughput": "0.00", "total_tokens": 0}
|