Shresthadev403 committed on
Commit
07713b6
·
verified ·
1 Parent(s): c914d6c

End of training

Browse files
README.md CHANGED
@@ -13,7 +13,7 @@ should probably proofread and complete it, then remove this comment. -->
13
 
14
  This model was trained from scratch on an unknown dataset.
15
  It achieves the following results on the evaluation set:
16
- - Loss: 3.2860
17
 
18
  ## Model description
19
 
 
13
 
14
  This model was trained from scratch on an unknown dataset.
15
  It achieves the following results on the evaluation set:
16
+ - Loss: 2.4815
17
 
18
  ## Model description
19
 
logs/events.out.tfevents.1705498568.ed78651fcb5b.26.0 CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:2f137b2c4f982df40b1835165df2efb0b8d6ecb9c0e36684e7019bb5f066d085
3
- size 1717786
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:695082ab22efaef9ae2a297e5a205acc1918b02972150fb6ff7ad1f538045453
3
+ size 1718214
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:fa878307e27c74d382612902a7b9e4c7ff9c804b946271146df2ac84b664ed5d
3
  size 535667604
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:312cf3588bb2cc38a8915a7119b0def981af42e9748073c024ef0e663cd9602c
3
  size 535667604
trainer_state.json CHANGED
@@ -1,9 +1,9 @@
1
  {
2
- "best_metric": 9.694682121276855,
3
- "best_model_checkpoint": "ner-bert-ingredientstesting/checkpoint-750",
4
- "epoch": 2.0212192657460424,
5
  "eval_steps": 750,
6
- "global_step": 1500,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
@@ -44,6 +44,20 @@
44
  "eval_samples_per_second": 59.268,
45
  "eval_steps_per_second": 0.936,
46
  "step": 1500
 
 
 
 
 
 
 
 
 
 
 
 
 
 
47
  }
48
  ],
49
  "logging_steps": 750,
@@ -51,7 +65,7 @@
51
  "num_input_tokens_seen": 0,
52
  "num_train_epochs": 50,
53
  "save_steps": 750,
54
- "total_flos": 6.492241636356096e+16,
55
  "train_batch_size": 16,
56
  "trial_name": null,
57
  "trial_params": null
 
1
  {
2
+ "best_metric": 3.2859976291656494,
3
+ "best_model_checkpoint": "ner-bert-ingredientstesting/checkpoint-1500",
4
+ "epoch": 3.031660491748063,
5
  "eval_steps": 750,
6
+ "global_step": 2250,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
 
44
  "eval_samples_per_second": 59.268,
45
  "eval_steps_per_second": 0.936,
46
  "step": 1500
47
+ },
48
+ {
49
+ "epoch": 3.03,
50
+ "learning_rate": 4.796900269541779e-05,
51
+ "loss": 2.8798,
52
+ "step": 2250
53
+ },
54
+ {
55
+ "epoch": 3.03,
56
+ "eval_loss": 2.4815261363983154,
57
+ "eval_runtime": 84.3896,
58
+ "eval_samples_per_second": 59.249,
59
+ "eval_steps_per_second": 0.936,
60
+ "step": 2250
61
  }
62
  ],
63
  "logging_steps": 750,
 
65
  "num_input_tokens_seen": 0,
66
  "num_train_epochs": 50,
67
  "save_steps": 750,
68
+ "total_flos": 9.738227193864192e+16,
69
  "train_batch_size": 16,
70
  "trial_name": null,
71
  "trial_params": null