cruiser commited on
Commit
a5780cd
·
1 Parent(s): e56346e

Training in progress, epoch 3

Browse files
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:a6b43d784e08c955dcffa035b182ea3ad7778e8bf7c1ae13d24dd5bb390a8f02
3
  size 535707205
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:eff679c74112e14072c551bd9d3c2b560f0f107e30a9249c78ce99123c9ce24e
3
  size 535707205
last-checkpoint/pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:5d01fd0df85ed20d98b1b2d1f341bb4c14f6e0e0439fb8f078c1b00d663c05d4
3
  size 267858605
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5bda6c1fc6a88fe6b9030005770ba7f46419356865032d57318a97472d081ccf
3
  size 267858605
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:ec413b9ccb2e7bf299f05612d1ea984d788cd968b214a3f7972297c05d91216b
3
  size 14575
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:47fe60f138b6682f4f11f1710b9ddc0fb2882408668973136d874097a9110f35
3
  size 14575
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:7524676a9651ec8c0d685a583a2fce1a7529148810db182eac434accbd0d75cb
3
  size 627
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:418275b5fc548956987d7f03901d0cd4d34ba2005600e9bf3d5900b248c41079
3
  size 627
last-checkpoint/trainer_state.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
- "best_metric": 0.5246105790138245,
3
- "best_model_checkpoint": "distilbert_final_config_dropout/checkpoint-3436",
4
- "epoch": 2.0,
5
- "global_step": 3436,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
@@ -62,11 +62,45 @@
62
  "eval_samples_per_second": 437.12,
63
  "eval_steps_per_second": 27.335,
64
  "step": 3436
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
65
  }
66
  ],
67
  "max_steps": 34360,
68
  "num_train_epochs": 20,
69
- "total_flos": 1564235020691640.0,
70
  "trial_name": null,
71
  "trial_params": null
72
  }
 
1
  {
2
+ "best_metric": 0.5194681286811829,
3
+ "best_model_checkpoint": "distilbert_final_config_dropout/checkpoint-5154",
4
+ "epoch": 3.0,
5
+ "global_step": 5154,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
 
62
  "eval_samples_per_second": 437.12,
63
  "eval_steps_per_second": 27.335,
64
  "step": 3436
65
+ },
66
+ {
67
+ "epoch": 2.04,
68
+ "learning_rate": 1.7962747380675206e-05,
69
+ "loss": 0.4785,
70
+ "step": 3500
71
+ },
72
+ {
73
+ "epoch": 2.33,
74
+ "learning_rate": 1.7671711292200233e-05,
75
+ "loss": 0.3916,
76
+ "step": 4000
77
+ },
78
+ {
79
+ "epoch": 2.62,
80
+ "learning_rate": 1.7380675203725264e-05,
81
+ "loss": 0.3933,
82
+ "step": 4500
83
+ },
84
+ {
85
+ "epoch": 2.91,
86
+ "learning_rate": 1.708963911525029e-05,
87
+ "loss": 0.4015,
88
+ "step": 5000
89
+ },
90
+ {
91
+ "epoch": 3.0,
92
+ "eval_accuracy": 0.7934352009054896,
93
+ "eval_f1": 0.7969035613432119,
94
+ "eval_loss": 0.5194681286811829,
95
+ "eval_runtime": 8.124,
96
+ "eval_samples_per_second": 435.009,
97
+ "eval_steps_per_second": 27.203,
98
+ "step": 5154
99
  }
100
  ],
101
  "max_steps": 34360,
102
  "num_train_epochs": 20,
103
+ "total_flos": 2346352531037460.0,
104
  "trial_name": null,
105
  "trial_params": null
106
  }
pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:5d01fd0df85ed20d98b1b2d1f341bb4c14f6e0e0439fb8f078c1b00d663c05d4
3
  size 267858605
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5bda6c1fc6a88fe6b9030005770ba7f46419356865032d57318a97472d081ccf
3
  size 267858605
runs/May01_07-08-02_af1ffd0a72ec/events.out.tfevents.1682924887.af1ffd0a72ec.975.14 CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:25999dc32109a70630c9f5cadb50d2f3c2ab0c2201b252655ca050efb1ee78c8
3
- size 5680
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4253ab64691164f9ec1c66be035048819342001a460aa6a51a8435d125c6ce51
3
+ size 6677