Training in progress, epoch 2
Browse files
model-00001-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4976698672
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:74aa81d766747d487f5a38c3cc685cf2b5658a2f161daf2b57bdc1187a83427c
|
3 |
size 4976698672
|
model-00002-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4999802720
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:29820c7b952833040fb380b8d89b2b1fded592db490f56481f1e40a5b9eb21a6
|
3 |
size 4999802720
|
model-00003-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4915916176
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ecfc94d45b1253da45117f224273a2546ee2b608d664169272b166a1b7a6fe77
|
3 |
size 4915916176
|
model-00004-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 1168138808
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8c8a6d37e7d9880f56f58873302a20d4f642dd63a9074b300d21d93b823f6627
|
3 |
size 1168138808
|
trainer_log.jsonl
CHANGED
@@ -12,3 +12,10 @@
|
|
12 |
{"current_steps": 110, "total_steps": 177, "loss": 0.6543, "lr": 5e-06, "epoch": 1.8469601677148848, "percentage": 62.15, "elapsed_time": "1:48:08", "remaining_time": "1:05:52"}
|
13 |
{"current_steps": 119, "total_steps": 177, "eval_loss": 0.6759442090988159, "epoch": 1.9979035639412999, "percentage": 67.23, "elapsed_time": "1:57:51", "remaining_time": "0:57:26"}
|
14 |
{"current_steps": 120, "total_steps": 177, "loss": 0.6821, "lr": 5e-06, "epoch": 2.0167714884696015, "percentage": 67.8, "elapsed_time": "2:00:03", "remaining_time": "0:57:01"}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
12 |
{"current_steps": 110, "total_steps": 177, "loss": 0.6543, "lr": 5e-06, "epoch": 1.8469601677148848, "percentage": 62.15, "elapsed_time": "1:48:08", "remaining_time": "1:05:52"}
|
13 |
{"current_steps": 119, "total_steps": 177, "eval_loss": 0.6759442090988159, "epoch": 1.9979035639412999, "percentage": 67.23, "elapsed_time": "1:57:51", "remaining_time": "0:57:26"}
|
14 |
{"current_steps": 120, "total_steps": 177, "loss": 0.6821, "lr": 5e-06, "epoch": 2.0167714884696015, "percentage": 67.8, "elapsed_time": "2:00:03", "remaining_time": "0:57:01"}
|
15 |
+
{"current_steps": 130, "total_steps": 177, "loss": 0.6222, "lr": 5e-06, "epoch": 2.1844863731656186, "percentage": 73.45, "elapsed_time": "2:09:40", "remaining_time": "0:46:52"}
|
16 |
+
{"current_steps": 140, "total_steps": 177, "loss": 0.6206, "lr": 5e-06, "epoch": 2.352201257861635, "percentage": 79.1, "elapsed_time": "2:19:18", "remaining_time": "0:36:49"}
|
17 |
+
{"current_steps": 150, "total_steps": 177, "loss": 0.6165, "lr": 5e-06, "epoch": 2.519916142557652, "percentage": 84.75, "elapsed_time": "2:28:56", "remaining_time": "0:26:48"}
|
18 |
+
{"current_steps": 160, "total_steps": 177, "loss": 0.6165, "lr": 5e-06, "epoch": 2.6876310272536688, "percentage": 90.4, "elapsed_time": "2:38:34", "remaining_time": "0:16:50"}
|
19 |
+
{"current_steps": 170, "total_steps": 177, "loss": 0.6175, "lr": 5e-06, "epoch": 2.8553459119496853, "percentage": 96.05, "elapsed_time": "2:48:12", "remaining_time": "0:06:55"}
|
20 |
+
{"current_steps": 177, "total_steps": 177, "eval_loss": 0.6712015867233276, "epoch": 2.9727463312368974, "percentage": 100.0, "elapsed_time": "2:57:17", "remaining_time": "0:00:00"}
|
21 |
+
{"current_steps": 177, "total_steps": 177, "epoch": 2.9727463312368974, "percentage": 100.0, "elapsed_time": "2:58:32", "remaining_time": "0:00:00"}
|