Shresthadev403 committed on
Commit
f35d8c4
·
verified ·
1 Parent(s): 57368ad

End of training

Browse files
README.md CHANGED
@@ -13,7 +13,7 @@ should probably proofread and complete it, then remove this comment. -->
13
 
14
  This model was trained from scratch on an unknown dataset.
15
  It achieves the following results on the evaluation set:
16
- - Loss: 1.5255
17
 
18
  ## Model description
19
 
 
13
 
14
  This model was trained from scratch on an unknown dataset.
15
  It achieves the following results on the evaluation set:
16
+ - Loss: 1.4377
17
 
18
  ## Model description
19
 
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:47ba5eceb8f9e87cdb1f103986dbd1995ba6e02107d2e46434a3f3334766ea69
3
  size 535667604
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:33572d875c77405045bee1e1b6d196f3275e0230d0283937f3dd3a376f0bc665
3
  size 535667604
runs/Jan22_02-43-32_fbf1b033956c/events.out.tfevents.1705891414.fbf1b033956c.26.0 CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:4265bb71d1e21980073d9be0f5fca5978e1d19a43098ab6b9ad0f7344179bbf9
3
- size 1718246
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:05e58c37b81af20ab189b8b9620c8318b1c4301baa70ed985ad5d8eafe0372f6
3
+ size 1718674
trainer_state.json CHANGED
@@ -1,9 +1,9 @@
1
  {
2
  "best_metric": 1.4617092609405518,
3
  "best_model_checkpoint": "ner-bert-ingredientstesting/checkpoint-9000",
4
- "epoch": 16.17143819467834,
5
  "eval_steps": 750,
6
- "global_step": 12000,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
@@ -240,6 +240,20 @@
240
  "eval_samples_per_second": 59.118,
241
  "eval_steps_per_second": 0.934,
242
  "step": 12000
 
 
 
 
 
 
 
 
 
 
 
 
 
 
243
  }
244
  ],
245
  "logging_steps": 750,
@@ -247,7 +261,7 @@
247
  "num_input_tokens_seen": 0,
248
  "num_train_epochs": 100,
249
  "save_steps": 750,
250
- "total_flos": 5.193603944146944e+17,
251
  "train_batch_size": 16,
252
  "trial_name": null,
253
  "trial_params": null
 
1
  {
2
  "best_metric": 1.4617092609405518,
3
  "best_model_checkpoint": "ner-bert-ingredientstesting/checkpoint-9000",
4
+ "epoch": 17.181879420680364,
5
  "eval_steps": 750,
6
+ "global_step": 12750,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
 
240
  "eval_samples_per_second": 59.118,
241
  "eval_steps_per_second": 0.934,
242
  "step": 12000
243
+ },
244
+ {
245
+ "epoch": 17.18,
246
+ "learning_rate": 4.7979110512129385e-05,
247
+ "loss": 0.9732,
248
+ "step": 12750
249
+ },
250
+ {
251
+ "epoch": 17.18,
252
+ "eval_loss": 1.4376968145370483,
253
+ "eval_runtime": 84.6742,
254
+ "eval_samples_per_second": 59.05,
255
+ "eval_steps_per_second": 0.933,
256
+ "step": 12750
257
  }
258
  ],
259
  "logging_steps": 750,
 
261
  "num_input_tokens_seen": 0,
262
  "num_train_epochs": 100,
263
  "save_steps": 750,
264
+ "total_flos": 5.5182024998977536e+17,
265
  "train_batch_size": 16,
266
  "trial_name": null,
267
  "trial_params": null