lewtun HF staff committed on
Commit
72c68ee
1 Parent(s): e8a39de

Model save

Browse files
all_results.json CHANGED
@@ -1,13 +1,13 @@
1
  {
2
  "epoch": 1.0,
3
- "eval_loss": 0.9360857009887695,
4
- "eval_runtime": 142.4328,
5
  "eval_samples": 23110,
6
- "eval_samples_per_second": 108.339,
7
- "eval_steps_per_second": 1.699,
8
- "train_loss": 0.07633444366105106,
9
- "train_runtime": 563.397,
10
  "train_samples": 207865,
11
- "train_samples_per_second": 247.474,
12
- "train_steps_per_second": 1.935
13
  }
 
1
  {
2
  "epoch": 1.0,
3
+ "eval_loss": 0.9360852241516113,
4
+ "eval_runtime": 142.4913,
5
  "eval_samples": 23110,
6
+ "eval_samples_per_second": 108.294,
7
+ "eval_steps_per_second": 1.698,
8
+ "train_loss": 0.07633398782222643,
9
+ "train_runtime": 563.604,
10
  "train_samples": 207865,
11
+ "train_samples_per_second": 247.383,
12
+ "train_steps_per_second": 1.934
13
  }
eval_results.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
  "epoch": 1.0,
3
- "eval_loss": 0.9360857009887695,
4
- "eval_runtime": 142.4328,
5
  "eval_samples": 23110,
6
- "eval_samples_per_second": 108.339,
7
- "eval_steps_per_second": 1.699
8
  }
 
1
  {
2
  "epoch": 1.0,
3
+ "eval_loss": 0.9360852241516113,
4
+ "eval_runtime": 142.4913,
5
  "eval_samples": 23110,
6
+ "eval_samples_per_second": 108.294,
7
+ "eval_steps_per_second": 1.698
8
  }
model-00001-of-00003.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:f785798732c7ef26d34f5056ed95c789cca31876fc2729a8688e91a64f158975
3
  size 4943162336
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d962f5f669d3b46ec1ee3f616d374040c5b5341d94e31eb87c37b783850a6941
3
  size 4943162336
model-00002-of-00003.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:177eaac08f7ca90baa649f6c2eb979843b9bdd29897c8f18f53902c60c19df52
3
  size 4999819336
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:70645b2075d65260c14c0cd5b6587092bf6ad7baf2ec58bacb170f20d06b8453
3
  size 4999819336
model-00003-of-00003.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:9e07e16b881fdcd0767315f89c90e17b12c08f7fa9626f3a9c98af34ef8e11de
3
  size 4540516344
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:44584b41e975a724de8f368833fca905f60dd80bdc3307178aab1a1b9ca18e07
3
  size 4540516344
runs/Jan04_11-14-47_ip-26-0-173-202/events.out.tfevents.1704366960.ip-26-0-173-202.768748.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bd81d94fbac36a437fc4f0ee2b90ef0985a241c1709771aec78e28d8d52ca9e3
3
+ size 7882
runs/Jan04_11-14-47_ip-26-0-173-202/events.out.tfevents.1704367666.ip-26-0-173-202.768748.1 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:432bf01d585d5a919362be4a588de1d99f432349fe1d563ac4f6d96a799a4f21
3
+ size 359
train_results.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
  "epoch": 1.0,
3
- "train_loss": 0.07633444366105106,
4
- "train_runtime": 563.397,
5
  "train_samples": 207865,
6
- "train_samples_per_second": 247.474,
7
- "train_steps_per_second": 1.935
8
  }
 
1
  {
2
  "epoch": 1.0,
3
+ "train_loss": 0.07633398782222643,
4
+ "train_runtime": 563.604,
5
  "train_samples": 207865,
6
+ "train_samples_per_second": 247.383,
7
+ "train_steps_per_second": 1.934
8
  }
trainer_state.json CHANGED
@@ -1217,13 +1217,13 @@
1217
  {
1218
  "epoch": 0.92,
1219
  "learning_rate": 2.985942075541848e-07,
1220
- "loss": 0.9267,
1221
  "step": 1005
1222
  },
1223
  {
1224
  "epoch": 0.93,
1225
  "learning_rate": 2.646499188279328e-07,
1226
- "loss": 0.9119,
1227
  "step": 1010
1228
  },
1229
  {
@@ -1283,7 +1283,7 @@
1283
  {
1284
  "epoch": 0.97,
1285
  "learning_rate": 3.735843446830867e-08,
1286
- "loss": 0.9228,
1287
  "step": 1060
1288
  },
1289
  {
@@ -1301,7 +1301,7 @@
1301
  {
1302
  "epoch": 0.99,
1303
  "learning_rate": 9.343974109685684e-09,
1304
- "loss": 0.9278,
1305
  "step": 1075
1306
  },
1307
  {
@@ -1324,9 +1324,9 @@
1324
  },
1325
  {
1326
  "epoch": 1.0,
1327
- "eval_loss": 0.9360857009887695,
1328
- "eval_runtime": 143.3612,
1329
- "eval_samples_per_second": 107.637,
1330
  "eval_steps_per_second": 1.688,
1331
  "step": 1090
1332
  },
@@ -1334,10 +1334,10 @@
1334
  "epoch": 1.0,
1335
  "step": 1090,
1336
  "total_flos": 456447649382400.0,
1337
- "train_loss": 0.07633444366105106,
1338
- "train_runtime": 563.397,
1339
- "train_samples_per_second": 247.474,
1340
- "train_steps_per_second": 1.935
1341
  }
1342
  ],
1343
  "logging_steps": 5,
 
1217
  {
1218
  "epoch": 0.92,
1219
  "learning_rate": 2.985942075541848e-07,
1220
+ "loss": 0.9266,
1221
  "step": 1005
1222
  },
1223
  {
1224
  "epoch": 0.93,
1225
  "learning_rate": 2.646499188279328e-07,
1226
+ "loss": 0.912,
1227
  "step": 1010
1228
  },
1229
  {
 
1283
  {
1284
  "epoch": 0.97,
1285
  "learning_rate": 3.735843446830867e-08,
1286
+ "loss": 0.9227,
1287
  "step": 1060
1288
  },
1289
  {
 
1301
  {
1302
  "epoch": 0.99,
1303
  "learning_rate": 9.343974109685684e-09,
1304
+ "loss": 0.9277,
1305
  "step": 1075
1306
  },
1307
  {
 
1324
  },
1325
  {
1326
  "epoch": 1.0,
1327
+ "eval_loss": 0.9360852241516113,
1328
+ "eval_runtime": 143.326,
1329
+ "eval_samples_per_second": 107.664,
1330
  "eval_steps_per_second": 1.688,
1331
  "step": 1090
1332
  },
 
1334
  "epoch": 1.0,
1335
  "step": 1090,
1336
  "total_flos": 456447649382400.0,
1337
+ "train_loss": 0.07633398782222643,
1338
+ "train_runtime": 563.604,
1339
+ "train_samples_per_second": 247.383,
1340
+ "train_steps_per_second": 1.934
1341
  }
1342
  ],
1343
  "logging_steps": 5,
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:0691346a7ead143f31dee13e381834e39d381f00c48ab175103779bd8ed770fd
3
  size 5880
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ebb8b817065113f0d4164ec672e5ca229a3f452e5837c978813720b0f6564d8e
3
  size 5880