Model save
Browse files- all_results.json +8 -8
- eval_results.json +4 -4
- model-00001-of-00003.safetensors +1 -1
- model-00002-of-00003.safetensors +1 -1
- model-00003-of-00003.safetensors +1 -1
- runs/Jan04_11-14-47_ip-26-0-173-202/events.out.tfevents.1704366960.ip-26-0-173-202.768748.0 +3 -0
- runs/Jan04_11-14-47_ip-26-0-173-202/events.out.tfevents.1704367666.ip-26-0-173-202.768748.1 +3 -0
- train_results.json +4 -4
- trainer_state.json +11 -11
- training_args.bin +1 -1
all_results.json
CHANGED
@@ -1,13 +1,13 @@
|
|
1 |
{
|
2 |
"epoch": 1.0,
|
3 |
-
"eval_loss": 0.
|
4 |
-
"eval_runtime": 142.
|
5 |
"eval_samples": 23110,
|
6 |
-
"eval_samples_per_second": 108.
|
7 |
-
"eval_steps_per_second": 1.
|
8 |
-
"train_loss": 0.
|
9 |
-
"train_runtime": 563.
|
10 |
"train_samples": 207865,
|
11 |
-
"train_samples_per_second": 247.
|
12 |
-
"train_steps_per_second": 1.
|
13 |
}
|
|
|
1 |
{
|
2 |
"epoch": 1.0,
|
3 |
+
"eval_loss": 0.9360852241516113,
|
4 |
+
"eval_runtime": 142.4913,
|
5 |
"eval_samples": 23110,
|
6 |
+
"eval_samples_per_second": 108.294,
|
7 |
+
"eval_steps_per_second": 1.698,
|
8 |
+
"train_loss": 0.07633398782222643,
|
9 |
+
"train_runtime": 563.604,
|
10 |
"train_samples": 207865,
|
11 |
+
"train_samples_per_second": 247.383,
|
12 |
+
"train_steps_per_second": 1.934
|
13 |
}
|
eval_results.json
CHANGED
@@ -1,8 +1,8 @@
|
|
1 |
{
|
2 |
"epoch": 1.0,
|
3 |
-
"eval_loss": 0.
|
4 |
-
"eval_runtime": 142.
|
5 |
"eval_samples": 23110,
|
6 |
-
"eval_samples_per_second": 108.
|
7 |
-
"eval_steps_per_second": 1.
|
8 |
}
|
|
|
1 |
{
|
2 |
"epoch": 1.0,
|
3 |
+
"eval_loss": 0.9360852241516113,
|
4 |
+
"eval_runtime": 142.4913,
|
5 |
"eval_samples": 23110,
|
6 |
+
"eval_samples_per_second": 108.294,
|
7 |
+
"eval_steps_per_second": 1.698
|
8 |
}
|
model-00001-of-00003.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4943162336
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d962f5f669d3b46ec1ee3f616d374040c5b5341d94e31eb87c37b783850a6941
|
3 |
size 4943162336
|
model-00002-of-00003.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4999819336
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:70645b2075d65260c14c0cd5b6587092bf6ad7baf2ec58bacb170f20d06b8453
|
3 |
size 4999819336
|
model-00003-of-00003.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4540516344
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:44584b41e975a724de8f368833fca905f60dd80bdc3307178aab1a1b9ca18e07
|
3 |
size 4540516344
|
runs/Jan04_11-14-47_ip-26-0-173-202/events.out.tfevents.1704366960.ip-26-0-173-202.768748.0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:bd81d94fbac36a437fc4f0ee2b90ef0985a241c1709771aec78e28d8d52ca9e3
|
3 |
+
size 7882
|
runs/Jan04_11-14-47_ip-26-0-173-202/events.out.tfevents.1704367666.ip-26-0-173-202.768748.1
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:432bf01d585d5a919362be4a588de1d99f432349fe1d563ac4f6d96a799a4f21
|
3 |
+
size 359
|
train_results.json
CHANGED
@@ -1,8 +1,8 @@
|
|
1 |
{
|
2 |
"epoch": 1.0,
|
3 |
-
"train_loss": 0.
|
4 |
-
"train_runtime": 563.
|
5 |
"train_samples": 207865,
|
6 |
-
"train_samples_per_second": 247.
|
7 |
-
"train_steps_per_second": 1.
|
8 |
}
|
|
|
1 |
{
|
2 |
"epoch": 1.0,
|
3 |
+
"train_loss": 0.07633398782222643,
|
4 |
+
"train_runtime": 563.604,
|
5 |
"train_samples": 207865,
|
6 |
+
"train_samples_per_second": 247.383,
|
7 |
+
"train_steps_per_second": 1.934
|
8 |
}
|
trainer_state.json
CHANGED
@@ -1217,13 +1217,13 @@
|
|
1217 |
{
|
1218 |
"epoch": 0.92,
|
1219 |
"learning_rate": 2.985942075541848e-07,
|
1220 |
-
"loss": 0.
|
1221 |
"step": 1005
|
1222 |
},
|
1223 |
{
|
1224 |
"epoch": 0.93,
|
1225 |
"learning_rate": 2.646499188279328e-07,
|
1226 |
-
"loss": 0.
|
1227 |
"step": 1010
|
1228 |
},
|
1229 |
{
|
@@ -1283,7 +1283,7 @@
|
|
1283 |
{
|
1284 |
"epoch": 0.97,
|
1285 |
"learning_rate": 3.735843446830867e-08,
|
1286 |
-
"loss": 0.
|
1287 |
"step": 1060
|
1288 |
},
|
1289 |
{
|
@@ -1301,7 +1301,7 @@
|
|
1301 |
{
|
1302 |
"epoch": 0.99,
|
1303 |
"learning_rate": 9.343974109685684e-09,
|
1304 |
-
"loss": 0.
|
1305 |
"step": 1075
|
1306 |
},
|
1307 |
{
|
@@ -1324,9 +1324,9 @@
|
|
1324 |
},
|
1325 |
{
|
1326 |
"epoch": 1.0,
|
1327 |
-
"eval_loss": 0.
|
1328 |
-
"eval_runtime": 143.
|
1329 |
-
"eval_samples_per_second": 107.
|
1330 |
"eval_steps_per_second": 1.688,
|
1331 |
"step": 1090
|
1332 |
},
|
@@ -1334,10 +1334,10 @@
|
|
1334 |
"epoch": 1.0,
|
1335 |
"step": 1090,
|
1336 |
"total_flos": 456447649382400.0,
|
1337 |
-
"train_loss": 0.
|
1338 |
-
"train_runtime": 563.
|
1339 |
-
"train_samples_per_second": 247.
|
1340 |
-
"train_steps_per_second": 1.
|
1341 |
}
|
1342 |
],
|
1343 |
"logging_steps": 5,
|
|
|
1217 |
{
|
1218 |
"epoch": 0.92,
|
1219 |
"learning_rate": 2.985942075541848e-07,
|
1220 |
+
"loss": 0.9266,
|
1221 |
"step": 1005
|
1222 |
},
|
1223 |
{
|
1224 |
"epoch": 0.93,
|
1225 |
"learning_rate": 2.646499188279328e-07,
|
1226 |
+
"loss": 0.912,
|
1227 |
"step": 1010
|
1228 |
},
|
1229 |
{
|
|
|
1283 |
{
|
1284 |
"epoch": 0.97,
|
1285 |
"learning_rate": 3.735843446830867e-08,
|
1286 |
+
"loss": 0.9227,
|
1287 |
"step": 1060
|
1288 |
},
|
1289 |
{
|
|
|
1301 |
{
|
1302 |
"epoch": 0.99,
|
1303 |
"learning_rate": 9.343974109685684e-09,
|
1304 |
+
"loss": 0.9277,
|
1305 |
"step": 1075
|
1306 |
},
|
1307 |
{
|
|
|
1324 |
},
|
1325 |
{
|
1326 |
"epoch": 1.0,
|
1327 |
+
"eval_loss": 0.9360852241516113,
|
1328 |
+
"eval_runtime": 143.326,
|
1329 |
+
"eval_samples_per_second": 107.664,
|
1330 |
"eval_steps_per_second": 1.688,
|
1331 |
"step": 1090
|
1332 |
},
|
|
|
1334 |
"epoch": 1.0,
|
1335 |
"step": 1090,
|
1336 |
"total_flos": 456447649382400.0,
|
1337 |
+
"train_loss": 0.07633398782222643,
|
1338 |
+
"train_runtime": 563.604,
|
1339 |
+
"train_samples_per_second": 247.383,
|
1340 |
+
"train_steps_per_second": 1.934
|
1341 |
}
|
1342 |
],
|
1343 |
"logging_steps": 5,
|
training_args.bin
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 5880
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ebb8b817065113f0d4164ec672e5ca229a3f452e5837c978813720b0f6564d8e
|
3 |
size 5880
|