Training in progress, epoch 3
Browse files
model-00001-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4976698672
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d26ac89b433098421fed856645e713bd1b6a77e12f30775e2bdb04a6418350a2
|
3 |
size 4976698672
|
model-00002-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4999802720
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e369b152203a4637d5390d5d275a193464a58055e136ab366d2652d89878b75e
|
3 |
size 4999802720
|
model-00003-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4915916176
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c123299d6fae495f4f23650c70503f25676f9b440d19f2858084c4e92edde846
|
3 |
size 4915916176
|
model-00004-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 1168138808
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2a5fede60b30e9f4b392b6849c679350f1b469036bb25f8bd24fe69022be1205
|
3 |
size 1168138808
|
trainer_log.jsonl
CHANGED
@@ -87,3 +87,44 @@
|
|
87 |
{"current_steps": 850, "total_steps": 1266, "loss": 0.2369, "lr": 5e-06, "epoch": 2.014218009478673, "percentage": 67.14, "elapsed_time": "1:28:00", "remaining_time": "0:43:04"}
|
88 |
{"current_steps": 860, "total_steps": 1266, "loss": 0.2195, "lr": 5e-06, "epoch": 2.037914691943128, "percentage": 67.93, "elapsed_time": "1:28:58", "remaining_time": "0:42:00"}
|
89 |
{"current_steps": 870, "total_steps": 1266, "loss": 0.2199, "lr": 5e-06, "epoch": 2.061611374407583, "percentage": 68.72, "elapsed_time": "1:29:59", "remaining_time": "0:40:57"}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
87 |
{"current_steps": 850, "total_steps": 1266, "loss": 0.2369, "lr": 5e-06, "epoch": 2.014218009478673, "percentage": 67.14, "elapsed_time": "1:28:00", "remaining_time": "0:43:04"}
|
88 |
{"current_steps": 860, "total_steps": 1266, "loss": 0.2195, "lr": 5e-06, "epoch": 2.037914691943128, "percentage": 67.93, "elapsed_time": "1:28:58", "remaining_time": "0:42:00"}
|
89 |
{"current_steps": 870, "total_steps": 1266, "loss": 0.2199, "lr": 5e-06, "epoch": 2.061611374407583, "percentage": 68.72, "elapsed_time": "1:29:59", "remaining_time": "0:40:57"}
|
90 |
+
{"current_steps": 880, "total_steps": 1266, "loss": 0.2204, "lr": 5e-06, "epoch": 2.085308056872038, "percentage": 69.51, "elapsed_time": "1:30:57", "remaining_time": "0:39:53"}
|
91 |
+
{"current_steps": 890, "total_steps": 1266, "loss": 0.2207, "lr": 5e-06, "epoch": 2.109004739336493, "percentage": 70.3, "elapsed_time": "1:31:56", "remaining_time": "0:38:50"}
|
92 |
+
{"current_steps": 900, "total_steps": 1266, "loss": 0.2205, "lr": 5e-06, "epoch": 2.132701421800948, "percentage": 71.09, "elapsed_time": "1:32:55", "remaining_time": "0:37:47"}
|
93 |
+
{"current_steps": 910, "total_steps": 1266, "loss": 0.2202, "lr": 5e-06, "epoch": 2.156398104265403, "percentage": 71.88, "elapsed_time": "1:33:53", "remaining_time": "0:36:43"}
|
94 |
+
{"current_steps": 920, "total_steps": 1266, "loss": 0.2213, "lr": 5e-06, "epoch": 2.1800947867298577, "percentage": 72.67, "elapsed_time": "1:34:51", "remaining_time": "0:35:40"}
|
95 |
+
{"current_steps": 930, "total_steps": 1266, "loss": 0.2237, "lr": 5e-06, "epoch": 2.2037914691943126, "percentage": 73.46, "elapsed_time": "1:35:50", "remaining_time": "0:34:37"}
|
96 |
+
{"current_steps": 940, "total_steps": 1266, "loss": 0.2196, "lr": 5e-06, "epoch": 2.227488151658768, "percentage": 74.25, "elapsed_time": "1:36:48", "remaining_time": "0:33:34"}
|
97 |
+
{"current_steps": 950, "total_steps": 1266, "loss": 0.2213, "lr": 5e-06, "epoch": 2.251184834123223, "percentage": 75.04, "elapsed_time": "1:37:48", "remaining_time": "0:32:32"}
|
98 |
+
{"current_steps": 960, "total_steps": 1266, "loss": 0.22, "lr": 5e-06, "epoch": 2.2748815165876777, "percentage": 75.83, "elapsed_time": "1:38:46", "remaining_time": "0:31:29"}
|
99 |
+
{"current_steps": 970, "total_steps": 1266, "loss": 0.2209, "lr": 5e-06, "epoch": 2.2985781990521326, "percentage": 76.62, "elapsed_time": "1:39:45", "remaining_time": "0:30:26"}
|
100 |
+
{"current_steps": 980, "total_steps": 1266, "loss": 0.225, "lr": 5e-06, "epoch": 2.322274881516588, "percentage": 77.41, "elapsed_time": "1:40:44", "remaining_time": "0:29:24"}
|
101 |
+
{"current_steps": 990, "total_steps": 1266, "loss": 0.2236, "lr": 5e-06, "epoch": 2.345971563981043, "percentage": 78.2, "elapsed_time": "1:41:43", "remaining_time": "0:28:21"}
|
102 |
+
{"current_steps": 1000, "total_steps": 1266, "loss": 0.2216, "lr": 5e-06, "epoch": 2.3696682464454977, "percentage": 78.99, "elapsed_time": "1:42:42", "remaining_time": "0:27:19"}
|
103 |
+
{"current_steps": 1010, "total_steps": 1266, "loss": 0.2233, "lr": 5e-06, "epoch": 2.3933649289099526, "percentage": 79.78, "elapsed_time": "1:43:40", "remaining_time": "0:26:16"}
|
104 |
+
{"current_steps": 1020, "total_steps": 1266, "loss": 0.2228, "lr": 5e-06, "epoch": 2.4170616113744074, "percentage": 80.57, "elapsed_time": "1:44:38", "remaining_time": "0:25:14"}
|
105 |
+
{"current_steps": 1030, "total_steps": 1266, "loss": 0.2226, "lr": 5e-06, "epoch": 2.4407582938388623, "percentage": 81.36, "elapsed_time": "1:45:36", "remaining_time": "0:24:11"}
|
106 |
+
{"current_steps": 1040, "total_steps": 1266, "loss": 0.2211, "lr": 5e-06, "epoch": 2.4644549763033177, "percentage": 82.15, "elapsed_time": "1:46:35", "remaining_time": "0:23:09"}
|
107 |
+
{"current_steps": 1050, "total_steps": 1266, "loss": 0.2225, "lr": 5e-06, "epoch": 2.4881516587677726, "percentage": 82.94, "elapsed_time": "1:47:34", "remaining_time": "0:22:07"}
|
108 |
+
{"current_steps": 1060, "total_steps": 1266, "loss": 0.2207, "lr": 5e-06, "epoch": 2.5118483412322274, "percentage": 83.73, "elapsed_time": "1:48:33", "remaining_time": "0:21:05"}
|
109 |
+
{"current_steps": 1070, "total_steps": 1266, "loss": 0.2224, "lr": 5e-06, "epoch": 2.5355450236966823, "percentage": 84.52, "elapsed_time": "1:49:32", "remaining_time": "0:20:03"}
|
110 |
+
{"current_steps": 1080, "total_steps": 1266, "loss": 0.2193, "lr": 5e-06, "epoch": 2.5592417061611377, "percentage": 85.31, "elapsed_time": "1:50:32", "remaining_time": "0:19:02"}
|
111 |
+
{"current_steps": 1090, "total_steps": 1266, "loss": 0.2215, "lr": 5e-06, "epoch": 2.5829383886255926, "percentage": 86.1, "elapsed_time": "1:51:30", "remaining_time": "0:18:00"}
|
112 |
+
{"current_steps": 1100, "total_steps": 1266, "loss": 0.2239, "lr": 5e-06, "epoch": 2.6066350710900474, "percentage": 86.89, "elapsed_time": "1:52:29", "remaining_time": "0:16:58"}
|
113 |
+
{"current_steps": 1110, "total_steps": 1266, "loss": 0.225, "lr": 5e-06, "epoch": 2.6303317535545023, "percentage": 87.68, "elapsed_time": "1:53:27", "remaining_time": "0:15:56"}
|
114 |
+
{"current_steps": 1120, "total_steps": 1266, "loss": 0.2217, "lr": 5e-06, "epoch": 2.654028436018957, "percentage": 88.47, "elapsed_time": "1:54:25", "remaining_time": "0:14:54"}
|
115 |
+
{"current_steps": 1130, "total_steps": 1266, "loss": 0.2223, "lr": 5e-06, "epoch": 2.677725118483412, "percentage": 89.26, "elapsed_time": "1:55:23", "remaining_time": "0:13:53"}
|
116 |
+
{"current_steps": 1140, "total_steps": 1266, "loss": 0.2202, "lr": 5e-06, "epoch": 2.7014218009478674, "percentage": 90.05, "elapsed_time": "1:56:22", "remaining_time": "0:12:51"}
|
117 |
+
{"current_steps": 1150, "total_steps": 1266, "loss": 0.2203, "lr": 5e-06, "epoch": 2.7251184834123223, "percentage": 90.84, "elapsed_time": "1:57:20", "remaining_time": "0:11:50"}
|
118 |
+
{"current_steps": 1160, "total_steps": 1266, "loss": 0.2195, "lr": 5e-06, "epoch": 2.748815165876777, "percentage": 91.63, "elapsed_time": "1:58:19", "remaining_time": "0:10:48"}
|
119 |
+
{"current_steps": 1170, "total_steps": 1266, "loss": 0.2201, "lr": 5e-06, "epoch": 2.772511848341232, "percentage": 92.42, "elapsed_time": "1:59:18", "remaining_time": "0:09:47"}
|
120 |
+
{"current_steps": 1180, "total_steps": 1266, "loss": 0.2241, "lr": 5e-06, "epoch": 2.7962085308056874, "percentage": 93.21, "elapsed_time": "2:00:17", "remaining_time": "0:08:46"}
|
121 |
+
{"current_steps": 1190, "total_steps": 1266, "loss": 0.2185, "lr": 5e-06, "epoch": 2.8199052132701423, "percentage": 94.0, "elapsed_time": "2:01:15", "remaining_time": "0:07:44"}
|
122 |
+
{"current_steps": 1200, "total_steps": 1266, "loss": 0.2218, "lr": 5e-06, "epoch": 2.843601895734597, "percentage": 94.79, "elapsed_time": "2:02:14", "remaining_time": "0:06:43"}
|
123 |
+
{"current_steps": 1210, "total_steps": 1266, "loss": 0.2211, "lr": 5e-06, "epoch": 2.867298578199052, "percentage": 95.58, "elapsed_time": "2:03:12", "remaining_time": "0:05:42"}
|
124 |
+
{"current_steps": 1220, "total_steps": 1266, "loss": 0.2194, "lr": 5e-06, "epoch": 2.890995260663507, "percentage": 96.37, "elapsed_time": "2:04:10", "remaining_time": "0:04:40"}
|
125 |
+
{"current_steps": 1230, "total_steps": 1266, "loss": 0.2258, "lr": 5e-06, "epoch": 2.914691943127962, "percentage": 97.16, "elapsed_time": "2:05:09", "remaining_time": "0:03:39"}
|
126 |
+
{"current_steps": 1240, "total_steps": 1266, "loss": 0.2218, "lr": 5e-06, "epoch": 2.938388625592417, "percentage": 97.95, "elapsed_time": "2:06:07", "remaining_time": "0:02:38"}
|
127 |
+
{"current_steps": 1250, "total_steps": 1266, "loss": 0.2211, "lr": 5e-06, "epoch": 2.962085308056872, "percentage": 98.74, "elapsed_time": "2:07:07", "remaining_time": "0:01:37"}
|
128 |
+
{"current_steps": 1260, "total_steps": 1266, "loss": 0.2241, "lr": 5e-06, "epoch": 2.985781990521327, "percentage": 99.53, "elapsed_time": "2:08:39", "remaining_time": "0:00:36"}
|
129 |
+
{"current_steps": 1266, "total_steps": 1266, "eval_loss": 0.30088362097740173, "epoch": 3.0, "percentage": 100.0, "elapsed_time": "2:11:24", "remaining_time": "0:00:00"}
|
130 |
+
{"current_steps": 1266, "total_steps": 1266, "epoch": 3.0, "percentage": 100.0, "elapsed_time": "2:13:03", "remaining_time": "0:00:00"}
|