cruiser committed on
Commit
e56346e
·
1 Parent(s): 8f02ea5

Training in progress, epoch 2

Browse files
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:f6da5cd4b0656262aa2c5e33402b4ea5a9c30124eb96f4ad5b6f04869f81c36e
3
  size 535707205
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a6b43d784e08c955dcffa035b182ea3ad7778e8bf7c1ae13d24dd5bb390a8f02
3
  size 535707205
last-checkpoint/pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:140674d2406857363e180b3415c2e2a7fcea896327f3aab36609b258e2b89e55
3
  size 267858605
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5d01fd0df85ed20d98b1b2d1f341bb4c14f6e0e0439fb8f078c1b00d663c05d4
3
  size 267858605
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:1afa4fb390fed62209a33ec31502a83421450b5e725ed87b9f6a0e5a6fe43e4a
3
  size 14575
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ec413b9ccb2e7bf299f05612d1ea984d788cd968b214a3f7972297c05d91216b
3
  size 14575
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:8887e02a63197212eb08e6268a00af8c32453672a22c577dcf1de8bc5e2b976a
3
  size 627
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7524676a9651ec8c0d685a583a2fce1a7529148810db182eac434accbd0d75cb
3
  size 627
last-checkpoint/trainer_state.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
- "best_metric": 0.5497974753379822,
3
- "best_model_checkpoint": "distilbert_final_config_dropout/checkpoint-1718",
4
- "epoch": 1.0,
5
- "global_step": 1718,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
@@ -34,11 +34,39 @@
34
  "eval_samples_per_second": 433.946,
35
  "eval_steps_per_second": 27.137,
36
  "step": 1718
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
37
  }
38
  ],
39
  "max_steps": 34360,
40
  "num_train_epochs": 20,
41
- "total_flos": 782117510345820.0,
42
  "trial_name": null,
43
  "trial_params": null
44
  }
 
1
  {
2
+ "best_metric": 0.5246105790138245,
3
+ "best_model_checkpoint": "distilbert_final_config_dropout/checkpoint-3436",
4
+ "epoch": 2.0,
5
+ "global_step": 3436,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
 
34
  "eval_samples_per_second": 433.946,
35
  "eval_steps_per_second": 27.137,
36
  "step": 1718
37
+ },
38
+ {
39
+ "epoch": 1.16,
40
+ "learning_rate": 1.8835855646100117e-05,
41
+ "loss": 0.4957,
42
+ "step": 2000
43
+ },
44
+ {
45
+ "epoch": 1.46,
46
+ "learning_rate": 1.8544819557625148e-05,
47
+ "loss": 0.4703,
48
+ "step": 2500
49
+ },
50
+ {
51
+ "epoch": 1.75,
52
+ "learning_rate": 1.825378346915018e-05,
53
+ "loss": 0.4683,
54
+ "step": 3000
55
+ },
56
+ {
57
+ "epoch": 2.0,
58
+ "eval_accuracy": 0.7920203735144312,
59
+ "eval_f1": 0.7952858811810856,
60
+ "eval_loss": 0.5246105790138245,
61
+ "eval_runtime": 8.0847,
62
+ "eval_samples_per_second": 437.12,
63
+ "eval_steps_per_second": 27.335,
64
+ "step": 3436
65
  }
66
  ],
67
  "max_steps": 34360,
68
  "num_train_epochs": 20,
69
+ "total_flos": 1564235020691640.0,
70
  "trial_name": null,
71
  "trial_params": null
72
  }
pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:140674d2406857363e180b3415c2e2a7fcea896327f3aab36609b258e2b89e55
3
  size 267858605
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5d01fd0df85ed20d98b1b2d1f341bb4c14f6e0e0439fb8f078c1b00d663c05d4
3
  size 267858605
runs/May01_07-08-02_af1ffd0a72ec/events.out.tfevents.1682924887.af1ffd0a72ec.975.14 CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:a9308464d673553c8070019e7feb9e18bc47465f1f244a6a92744101727de3da
3
- size 4840
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:25999dc32109a70630c9f5cadb50d2f3c2ab0c2201b252655ca050efb1ee78c8
3
+ size 5680