Training in progress, epoch 1
Browse files
model-00001-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4976698672
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:135eff8528ad6c5d038fc9630137d1054b68be9e9de16a63cf181b814e5a11a3
|
3 |
size 4976698672
|
model-00002-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4999802720
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3d69ed7a15b0168305cdd64ce9ddbf455a11e67df8d2f9854148d0901c8b2fcb
|
3 |
size 4999802720
|
model-00003-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4915916176
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:53c39fb1a308761ff2f24aaeea65b8b4ec41c248e5b8ba9dd7eb129cc45887c2
|
3 |
size 4915916176
|
model-00004-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 1168138808
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:656cdfc8446799100fd9224bd5409685ad25140ce1d59195c4e175b2dd524a40
|
3 |
size 1168138808
|
trainer_log.jsonl
CHANGED
@@ -2,3 +2,8 @@
|
|
2 |
{"current_steps": 20, "total_steps": 105, "loss": 1.087, "lr": 5e-06, "epoch": 0.5663716814159292, "percentage": 19.05, "elapsed_time": "0:53:44", "remaining_time": "3:48:24"}
|
3 |
{"current_steps": 30, "total_steps": 105, "loss": 1.0474, "lr": 5e-06, "epoch": 0.8495575221238938, "percentage": 28.57, "elapsed_time": "1:20:33", "remaining_time": "3:21:23"}
|
4 |
{"current_steps": 35, "total_steps": 105, "eval_loss": 1.021984577178955, "epoch": 0.9911504424778761, "percentage": 33.33, "elapsed_time": "1:36:48", "remaining_time": "3:13:36"}
|
|
|
|
|
|
|
|
|
|
|
|
2 |
{"current_steps": 20, "total_steps": 105, "loss": 1.087, "lr": 5e-06, "epoch": 0.5663716814159292, "percentage": 19.05, "elapsed_time": "0:53:44", "remaining_time": "3:48:24"}
|
3 |
{"current_steps": 30, "total_steps": 105, "loss": 1.0474, "lr": 5e-06, "epoch": 0.8495575221238938, "percentage": 28.57, "elapsed_time": "1:20:33", "remaining_time": "3:21:23"}
|
4 |
{"current_steps": 35, "total_steps": 105, "eval_loss": 1.021984577178955, "epoch": 0.9911504424778761, "percentage": 33.33, "elapsed_time": "1:36:48", "remaining_time": "3:13:36"}
|
5 |
+
{"current_steps": 40, "total_steps": 105, "loss": 1.0097, "lr": 5e-06, "epoch": 1.1327433628318584, "percentage": 38.1, "elapsed_time": "1:50:31", "remaining_time": "2:59:36"}
|
6 |
+
{"current_steps": 50, "total_steps": 105, "loss": 0.9766, "lr": 5e-06, "epoch": 1.415929203539823, "percentage": 47.62, "elapsed_time": "2:16:27", "remaining_time": "2:30:06"}
|
7 |
+
{"current_steps": 60, "total_steps": 105, "loss": 0.9627, "lr": 5e-06, "epoch": 1.6991150442477876, "percentage": 57.14, "elapsed_time": "2:42:23", "remaining_time": "2:01:47"}
|
8 |
+
{"current_steps": 70, "total_steps": 105, "loss": 0.9547, "lr": 5e-06, "epoch": 1.9823008849557522, "percentage": 66.67, "elapsed_time": "3:08:20", "remaining_time": "1:34:10"}
|
9 |
+
{"current_steps": 70, "total_steps": 105, "eval_loss": 0.9805734157562256, "epoch": 1.9823008849557522, "percentage": 66.67, "elapsed_time": "3:11:46", "remaining_time": "1:35:53"}
|