einargizz commited on
Commit
919bc63
1 Parent(s): 30f93fe

End of training

Browse files
all_results.json CHANGED
@@ -1,13 +1,13 @@
1
  {
2
  "epoch": 1.0,
3
- "eval_loss": 0.6321855187416077,
4
- "eval_runtime": 71.348,
5
- "eval_samples": 250,
6
- "eval_samples_per_second": 3.504,
7
- "eval_steps_per_second": 0.224,
8
- "eval_wer": 45.68657478305258,
9
- "train_loss": 1.2054000387191772,
10
- "train_runtime": 15609.5124,
11
- "train_samples_per_second": 4.1,
12
- "train_steps_per_second": 0.064
13
  }
 
1
  {
2
  "epoch": 1.0,
3
+ "eval_loss": 0.6313478946685791,
4
+ "eval_runtime": 711.2452,
5
+ "eval_samples": 500,
6
+ "eval_samples_per_second": 0.703,
7
+ "eval_steps_per_second": 0.045,
8
+ "eval_wer": 45.29159303206261,
9
+ "train_loss": 1.2053918581008911,
10
+ "train_runtime": 78451.7893,
11
+ "train_samples_per_second": 0.816,
12
+ "train_steps_per_second": 0.013
13
  }
eval_results.json CHANGED
@@ -1,9 +1,9 @@
1
  {
2
  "epoch": 1.0,
3
- "eval_loss": 0.6321855187416077,
4
- "eval_runtime": 71.348,
5
- "eval_samples": 250,
6
- "eval_samples_per_second": 3.504,
7
- "eval_steps_per_second": 0.224,
8
- "eval_wer": 45.68657478305258
9
  }
 
1
  {
2
  "epoch": 1.0,
3
+ "eval_loss": 0.6313478946685791,
4
+ "eval_runtime": 711.2452,
5
+ "eval_samples": 500,
6
+ "eval_samples_per_second": 0.703,
7
+ "eval_steps_per_second": 0.045,
8
+ "eval_wer": 45.29159303206261
9
  }
runs/Mar29_09-18-59_terra/events.out.tfevents.1680160948.terra.179326.2 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9a0597c554d7d50a6ca7d2c2acbd35225e4bbdb209c21ee5b1f23748eed6c687
3
+ size 406
train_results.json CHANGED
@@ -1,7 +1,7 @@
1
  {
2
  "epoch": 1.0,
3
- "train_loss": 1.2054000387191772,
4
- "train_runtime": 15609.5124,
5
- "train_samples_per_second": 4.1,
6
- "train_steps_per_second": 0.064
7
  }
 
1
  {
2
  "epoch": 1.0,
3
+ "train_loss": 1.2053918581008911,
4
+ "train_runtime": 78451.7893,
5
+ "train_samples_per_second": 0.816,
6
+ "train_steps_per_second": 0.013
7
  }
trainer_state.json CHANGED
@@ -1,5 +1,5 @@
1
  {
2
- "best_metric": 45.68657478305258,
3
  "best_model_checkpoint": "./output/checkpoint-1000",
4
  "epoch": 1.0,
5
  "global_step": 1000,
@@ -69,11 +69,11 @@
69
  },
70
  {
71
  "epoch": 0.25,
72
- "eval_loss": 1.5133659839630127,
73
- "eval_runtime": 49.0888,
74
- "eval_samples_per_second": 5.093,
75
- "eval_steps_per_second": 0.326,
76
- "eval_wer": 79.0199081163859,
77
  "step": 250
78
  },
79
  {
@@ -85,13 +85,13 @@
85
  {
86
  "epoch": 0.3,
87
  "learning_rate": 5.9600000000000005e-06,
88
- "loss": 1.3248,
89
  "step": 300
90
  },
91
  {
92
  "epoch": 0.33,
93
  "learning_rate": 6.460000000000001e-06,
94
- "loss": 1.2724,
95
  "step": 325
96
  },
97
  {
@@ -103,7 +103,7 @@
103
  {
104
  "epoch": 0.38,
105
  "learning_rate": 7.4600000000000006e-06,
106
- "loss": 1.0426,
107
  "step": 375
108
  },
109
  {
@@ -133,16 +133,16 @@
133
  {
134
  "epoch": 0.5,
135
  "learning_rate": 9.960000000000001e-06,
136
- "loss": 0.7719,
137
  "step": 500
138
  },
139
  {
140
  "epoch": 0.5,
141
- "eval_loss": 0.8723946213722229,
142
- "eval_runtime": 42.8226,
143
- "eval_samples_per_second": 5.838,
144
- "eval_steps_per_second": 0.374,
145
- "eval_wer": 61.20469627360898,
146
  "step": 500
147
  },
148
  {
@@ -154,7 +154,7 @@
154
  {
155
  "epoch": 0.55,
156
  "learning_rate": 9.040000000000002e-06,
157
- "loss": 0.7805,
158
  "step": 550
159
  },
160
  {
@@ -166,7 +166,7 @@
166
  {
167
  "epoch": 0.6,
168
  "learning_rate": 8.040000000000001e-06,
169
- "loss": 0.8321,
170
  "step": 600
171
  },
172
  {
@@ -196,7 +196,7 @@
196
  {
197
  "epoch": 0.72,
198
  "learning_rate": 5.540000000000001e-06,
199
- "loss": 0.7312,
200
  "step": 725
201
  },
202
  {
@@ -207,11 +207,11 @@
207
  },
208
  {
209
  "epoch": 0.75,
210
- "eval_loss": 0.6546878814697266,
211
- "eval_runtime": 41.6435,
212
- "eval_samples_per_second": 6.003,
213
- "eval_steps_per_second": 0.384,
214
- "eval_wer": 47.32006125574272,
215
  "step": 750
216
  },
217
  {
@@ -223,19 +223,19 @@
223
  {
224
  "epoch": 0.8,
225
  "learning_rate": 4.04e-06,
226
- "loss": 0.8042,
227
  "step": 800
228
  },
229
  {
230
  "epoch": 0.82,
231
  "learning_rate": 3.54e-06,
232
- "loss": 0.6615,
233
  "step": 825
234
  },
235
  {
236
  "epoch": 0.85,
237
  "learning_rate": 3.04e-06,
238
- "loss": 0.663,
239
  "step": 850
240
  },
241
  {
@@ -265,32 +265,32 @@
265
  {
266
  "epoch": 0.97,
267
  "learning_rate": 5.4e-07,
268
- "loss": 0.5841,
269
  "step": 975
270
  },
271
  {
272
  "epoch": 1.0,
273
  "learning_rate": 4e-08,
274
- "loss": 0.5734,
275
  "step": 1000
276
  },
277
  {
278
  "epoch": 1.0,
279
- "eval_loss": 0.6321855187416077,
280
- "eval_runtime": 76.4524,
281
- "eval_samples_per_second": 3.27,
282
- "eval_steps_per_second": 0.209,
283
- "eval_wer": 45.68657478305258,
284
  "step": 1000
285
  },
286
  {
287
  "epoch": 1.0,
288
  "step": 1000,
289
  "total_flos": 1.57560864768e+18,
290
- "train_loss": 1.2054000387191772,
291
- "train_runtime": 15609.5124,
292
- "train_samples_per_second": 4.1,
293
- "train_steps_per_second": 0.064
294
  }
295
  ],
296
  "max_steps": 1000,
 
1
  {
2
+ "best_metric": 45.29159303206261,
3
  "best_model_checkpoint": "./output/checkpoint-1000",
4
  "epoch": 1.0,
5
  "global_step": 1000,
 
69
  },
70
  {
71
  "epoch": 0.25,
72
+ "eval_loss": 1.4900375604629517,
73
+ "eval_runtime": 696.9939,
74
+ "eval_samples_per_second": 0.717,
75
+ "eval_steps_per_second": 0.046,
76
+ "eval_wer": 77.9348649330977,
77
  "step": 250
78
  },
79
  {
 
85
  {
86
  "epoch": 0.3,
87
  "learning_rate": 5.9600000000000005e-06,
88
+ "loss": 1.3247,
89
  "step": 300
90
  },
91
  {
92
  "epoch": 0.33,
93
  "learning_rate": 6.460000000000001e-06,
94
+ "loss": 1.2725,
95
  "step": 325
96
  },
97
  {
 
103
  {
104
  "epoch": 0.38,
105
  "learning_rate": 7.4600000000000006e-06,
106
+ "loss": 1.0425,
107
  "step": 375
108
  },
109
  {
 
133
  {
134
  "epoch": 0.5,
135
  "learning_rate": 9.960000000000001e-06,
136
+ "loss": 0.7722,
137
  "step": 500
138
  },
139
  {
140
  "epoch": 0.5,
141
+ "eval_loss": 0.8731086850166321,
142
+ "eval_runtime": 702.8815,
143
+ "eval_samples_per_second": 0.711,
144
+ "eval_steps_per_second": 0.046,
145
+ "eval_wer": 60.28780610956829,
146
  "step": 500
147
  },
148
  {
 
154
  {
155
  "epoch": 0.55,
156
  "learning_rate": 9.040000000000002e-06,
157
+ "loss": 0.7804,
158
  "step": 550
159
  },
160
  {
 
166
  {
167
  "epoch": 0.6,
168
  "learning_rate": 8.040000000000001e-06,
169
+ "loss": 0.832,
170
  "step": 600
171
  },
172
  {
 
196
  {
197
  "epoch": 0.72,
198
  "learning_rate": 5.540000000000001e-06,
199
+ "loss": 0.731,
200
  "step": 725
201
  },
202
  {
 
207
  },
208
  {
209
  "epoch": 0.75,
210
+ "eval_loss": 0.6534215211868286,
211
+ "eval_runtime": 681.508,
212
+ "eval_samples_per_second": 0.734,
213
+ "eval_steps_per_second": 0.047,
214
+ "eval_wer": 46.50340823024489,
215
  "step": 750
216
  },
217
  {
 
223
  {
224
  "epoch": 0.8,
225
  "learning_rate": 4.04e-06,
226
+ "loss": 0.8043,
227
  "step": 800
228
  },
229
  {
230
  "epoch": 0.82,
231
  "learning_rate": 3.54e-06,
232
+ "loss": 0.6616,
233
  "step": 825
234
  },
235
  {
236
  "epoch": 0.85,
237
  "learning_rate": 3.04e-06,
238
+ "loss": 0.6631,
239
  "step": 850
240
  },
241
  {
 
265
  {
266
  "epoch": 0.97,
267
  "learning_rate": 5.4e-07,
268
+ "loss": 0.5842,
269
  "step": 975
270
  },
271
  {
272
  "epoch": 1.0,
273
  "learning_rate": 4e-08,
274
+ "loss": 0.5733,
275
  "step": 1000
276
  },
277
  {
278
  "epoch": 1.0,
279
+ "eval_loss": 0.6313478946685791,
280
+ "eval_runtime": 708.6015,
281
+ "eval_samples_per_second": 0.706,
282
+ "eval_steps_per_second": 0.045,
283
+ "eval_wer": 45.29159303206261,
284
  "step": 1000
285
  },
286
  {
287
  "epoch": 1.0,
288
  "step": 1000,
289
  "total_flos": 1.57560864768e+18,
290
+ "train_loss": 1.2053918581008911,
291
+ "train_runtime": 78451.7893,
292
+ "train_samples_per_second": 0.816,
293
+ "train_steps_per_second": 0.013
294
  }
295
  ],
296
  "max_steps": 1000,