djbp committed on
Commit
58233da
1 Parent(s): ec024bf

End of training

Browse files
README.md CHANGED
@@ -22,7 +22,7 @@ model-index:
22
  metrics:
23
  - name: Accuracy
24
  type: accuracy
25
- value: 0.8819619527847811
26
  ---
27
 
28
  <!-- This model card has been generated automatically according to the information the Trainer had access to. You
@@ -32,8 +32,8 @@ should probably proofread and complete it, then remove this comment. -->
32
 
33
  This model is a fine-tuned version of [microsoft/swin-base-patch4-window7-224-in22k](https://huggingface.co/microsoft/swin-base-patch4-window7-224-in22k) on the imagefolder dataset.
34
  It achieves the following results on the evaluation set:
35
- - Loss: 0.3085
36
- - Accuracy: 0.8820
37
 
38
  ## Model description
39
 
 
22
  metrics:
23
  - name: Accuracy
24
  type: accuracy
25
+ value: 0.8837955535182214
26
  ---
27
 
28
  <!-- This model card has been generated automatically according to the information the Trainer had access to. You
 
32
 
33
  This model is a fine-tuned version of [microsoft/swin-base-patch4-window7-224-in22k](https://huggingface.co/microsoft/swin-base-patch4-window7-224-in22k) on the imagefolder dataset.
34
  It achieves the following results on the evaluation set:
35
+ - Loss: 0.3017
36
+ - Accuracy: 0.8838
37
 
38
  ## Model description
39
 
all_results.json ADDED
@@ -0,0 +1,13 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "epoch": 6.948905109489051,
3
+ "eval_accuracy": 0.8837955535182214,
4
+ "eval_loss": 0.30171430110931396,
5
+ "eval_runtime": 34.4194,
6
+ "eval_samples_per_second": 126.76,
7
+ "eval_steps_per_second": 2.005,
8
+ "total_flos": 9.517373864500433e+18,
9
+ "train_loss": 0.3870567884765753,
10
+ "train_runtime": 2171.3346,
11
+ "train_samples_per_second": 56.33,
12
+ "train_steps_per_second": 0.219
13
+ }
eval_results.json ADDED
@@ -0,0 +1,8 @@
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "epoch": 6.948905109489051,
3
+ "eval_accuracy": 0.8837955535182214,
4
+ "eval_loss": 0.30171430110931396,
5
+ "eval_runtime": 34.4194,
6
+ "eval_samples_per_second": 126.76,
7
+ "eval_steps_per_second": 2.005
8
+ }
runs/Aug17_17-48-22_ccfb1a2839c5/events.out.tfevents.1723919121.ccfb1a2839c5 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4fa58bac5faa3e74413681163507c555387a16fcbea241f33e7fb17c5a9163cd
3
+ size 140
train_results.json ADDED
@@ -0,0 +1,8 @@
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "epoch": 6.948905109489051,
3
+ "total_flos": 9.517373864500433e+18,
4
+ "train_loss": 0.3870567884765753,
5
+ "train_runtime": 2171.3346,
6
+ "train_samples_per_second": 56.33,
7
+ "train_steps_per_second": 0.219
8
+ }
trainer_state.json ADDED
@@ -0,0 +1,434 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "best_metric": 0.8837955535182214,
3
+ "best_model_checkpoint": "swin-base-patch4-window7-224-in22k-MM_Classification_base_web_images/checkpoint-342",
4
+ "epoch": 6.948905109489051,
5
+ "eval_steps": 500,
6
+ "global_step": 476,
7
+ "is_hyper_param_search": false,
8
+ "is_local_process_zero": true,
9
+ "is_world_process_zero": true,
10
+ "log_history": [
11
+ {
12
+ "epoch": 0.145985401459854,
13
+ "grad_norm": 3.675107717514038,
14
+ "learning_rate": 1.0416666666666668e-05,
15
+ "loss": 1.0612,
16
+ "step": 10
17
+ },
18
+ {
19
+ "epoch": 0.291970802919708,
20
+ "grad_norm": 3.70519757270813,
21
+ "learning_rate": 2.0833333333333336e-05,
22
+ "loss": 0.8853,
23
+ "step": 20
24
+ },
25
+ {
26
+ "epoch": 0.43795620437956206,
27
+ "grad_norm": 3.8755295276641846,
28
+ "learning_rate": 3.125e-05,
29
+ "loss": 0.7099,
30
+ "step": 30
31
+ },
32
+ {
33
+ "epoch": 0.583941605839416,
34
+ "grad_norm": 2.727118492126465,
35
+ "learning_rate": 4.166666666666667e-05,
36
+ "loss": 0.6121,
37
+ "step": 40
38
+ },
39
+ {
40
+ "epoch": 0.7299270072992701,
41
+ "grad_norm": 3.260768175125122,
42
+ "learning_rate": 4.976635514018692e-05,
43
+ "loss": 0.5736,
44
+ "step": 50
45
+ },
46
+ {
47
+ "epoch": 0.8759124087591241,
48
+ "grad_norm": 5.847088813781738,
49
+ "learning_rate": 4.85981308411215e-05,
50
+ "loss": 0.517,
51
+ "step": 60
52
+ },
53
+ {
54
+ "epoch": 0.9927007299270073,
55
+ "eval_accuracy": 0.8157231262892505,
56
+ "eval_loss": 0.4430324137210846,
57
+ "eval_runtime": 35.8383,
58
+ "eval_samples_per_second": 121.741,
59
+ "eval_steps_per_second": 1.925,
60
+ "step": 68
61
+ },
62
+ {
63
+ "epoch": 1.0218978102189782,
64
+ "grad_norm": 5.806203365325928,
65
+ "learning_rate": 4.742990654205608e-05,
66
+ "loss": 0.4972,
67
+ "step": 70
68
+ },
69
+ {
70
+ "epoch": 1.167883211678832,
71
+ "grad_norm": 2.751803159713745,
72
+ "learning_rate": 4.6261682242990654e-05,
73
+ "loss": 0.4767,
74
+ "step": 80
75
+ },
76
+ {
77
+ "epoch": 1.313868613138686,
78
+ "grad_norm": 2.5074498653411865,
79
+ "learning_rate": 4.5093457943925236e-05,
80
+ "loss": 0.4509,
81
+ "step": 90
82
+ },
83
+ {
84
+ "epoch": 1.4598540145985401,
85
+ "grad_norm": 3.3779966831207275,
86
+ "learning_rate": 4.392523364485982e-05,
87
+ "loss": 0.4496,
88
+ "step": 100
89
+ },
90
+ {
91
+ "epoch": 1.6058394160583942,
92
+ "grad_norm": 4.8917741775512695,
93
+ "learning_rate": 4.27570093457944e-05,
94
+ "loss": 0.4528,
95
+ "step": 110
96
+ },
97
+ {
98
+ "epoch": 1.7518248175182483,
99
+ "grad_norm": 4.1523966789245605,
100
+ "learning_rate": 4.1588785046728974e-05,
101
+ "loss": 0.4535,
102
+ "step": 120
103
+ },
104
+ {
105
+ "epoch": 1.897810218978102,
106
+ "grad_norm": 6.303163051605225,
107
+ "learning_rate": 4.0420560747663556e-05,
108
+ "loss": 0.4211,
109
+ "step": 130
110
+ },
111
+ {
112
+ "epoch": 2.0,
113
+ "eval_accuracy": 0.8457483382993353,
114
+ "eval_loss": 0.38001278042793274,
115
+ "eval_runtime": 36.8858,
116
+ "eval_samples_per_second": 118.284,
117
+ "eval_steps_per_second": 1.871,
118
+ "step": 137
119
+ },
120
+ {
121
+ "epoch": 2.0437956204379564,
122
+ "grad_norm": 6.562156677246094,
123
+ "learning_rate": 3.925233644859813e-05,
124
+ "loss": 0.4435,
125
+ "step": 140
126
+ },
127
+ {
128
+ "epoch": 2.18978102189781,
129
+ "grad_norm": 3.601300001144409,
130
+ "learning_rate": 3.808411214953271e-05,
131
+ "loss": 0.3971,
132
+ "step": 150
133
+ },
134
+ {
135
+ "epoch": 2.335766423357664,
136
+ "grad_norm": 4.384274005889893,
137
+ "learning_rate": 3.691588785046729e-05,
138
+ "loss": 0.4075,
139
+ "step": 160
140
+ },
141
+ {
142
+ "epoch": 2.4817518248175183,
143
+ "grad_norm": 3.9660568237304688,
144
+ "learning_rate": 3.574766355140187e-05,
145
+ "loss": 0.3788,
146
+ "step": 170
147
+ },
148
+ {
149
+ "epoch": 2.627737226277372,
150
+ "grad_norm": 4.195096492767334,
151
+ "learning_rate": 3.457943925233645e-05,
152
+ "loss": 0.376,
153
+ "step": 180
154
+ },
155
+ {
156
+ "epoch": 2.7737226277372264,
157
+ "grad_norm": 3.6591451168060303,
158
+ "learning_rate": 3.341121495327103e-05,
159
+ "loss": 0.3514,
160
+ "step": 190
161
+ },
162
+ {
163
+ "epoch": 2.9197080291970803,
164
+ "grad_norm": 3.5800323486328125,
165
+ "learning_rate": 3.224299065420561e-05,
166
+ "loss": 0.3532,
167
+ "step": 200
168
+ },
169
+ {
170
+ "epoch": 2.9927007299270074,
171
+ "eval_accuracy": 0.8615631446252578,
172
+ "eval_loss": 0.3563055098056793,
173
+ "eval_runtime": 36.2136,
174
+ "eval_samples_per_second": 120.48,
175
+ "eval_steps_per_second": 1.905,
176
+ "step": 205
177
+ },
178
+ {
179
+ "epoch": 3.065693430656934,
180
+ "grad_norm": 6.1199421882629395,
181
+ "learning_rate": 3.107476635514019e-05,
182
+ "loss": 0.3963,
183
+ "step": 210
184
+ },
185
+ {
186
+ "epoch": 3.2116788321167884,
187
+ "grad_norm": 4.893133163452148,
188
+ "learning_rate": 2.9906542056074764e-05,
189
+ "loss": 0.3358,
190
+ "step": 220
191
+ },
192
+ {
193
+ "epoch": 3.3576642335766422,
194
+ "grad_norm": 4.033535957336426,
195
+ "learning_rate": 2.873831775700935e-05,
196
+ "loss": 0.3398,
197
+ "step": 230
198
+ },
199
+ {
200
+ "epoch": 3.5036496350364965,
201
+ "grad_norm": 4.510129928588867,
202
+ "learning_rate": 2.7570093457943924e-05,
203
+ "loss": 0.3628,
204
+ "step": 240
205
+ },
206
+ {
207
+ "epoch": 3.6496350364963503,
208
+ "grad_norm": 3.0796680450439453,
209
+ "learning_rate": 2.6401869158878506e-05,
210
+ "loss": 0.3171,
211
+ "step": 250
212
+ },
213
+ {
214
+ "epoch": 3.795620437956204,
215
+ "grad_norm": 4.170633316040039,
216
+ "learning_rate": 2.5233644859813084e-05,
217
+ "loss": 0.3299,
218
+ "step": 260
219
+ },
220
+ {
221
+ "epoch": 3.9416058394160585,
222
+ "grad_norm": 9.109073638916016,
223
+ "learning_rate": 2.4065420560747666e-05,
224
+ "loss": 0.3365,
225
+ "step": 270
226
+ },
227
+ {
228
+ "epoch": 4.0,
229
+ "eval_accuracy": 0.8700435480174192,
230
+ "eval_loss": 0.3332568407058716,
231
+ "eval_runtime": 36.1676,
232
+ "eval_samples_per_second": 120.633,
233
+ "eval_steps_per_second": 1.908,
234
+ "step": 274
235
+ },
236
+ {
237
+ "epoch": 4.087591240875913,
238
+ "grad_norm": 4.610809803009033,
239
+ "learning_rate": 2.2897196261682244e-05,
240
+ "loss": 0.3744,
241
+ "step": 280
242
+ },
243
+ {
244
+ "epoch": 4.233576642335766,
245
+ "grad_norm": 4.210699558258057,
246
+ "learning_rate": 2.1728971962616822e-05,
247
+ "loss": 0.3022,
248
+ "step": 290
249
+ },
250
+ {
251
+ "epoch": 4.37956204379562,
252
+ "grad_norm": 4.85805082321167,
253
+ "learning_rate": 2.05607476635514e-05,
254
+ "loss": 0.2934,
255
+ "step": 300
256
+ },
257
+ {
258
+ "epoch": 4.525547445255475,
259
+ "grad_norm": 3.4125349521636963,
260
+ "learning_rate": 1.9392523364485982e-05,
261
+ "loss": 0.312,
262
+ "step": 310
263
+ },
264
+ {
265
+ "epoch": 4.671532846715328,
266
+ "grad_norm": 4.196589946746826,
267
+ "learning_rate": 1.822429906542056e-05,
268
+ "loss": 0.2963,
269
+ "step": 320
270
+ },
271
+ {
272
+ "epoch": 4.817518248175182,
273
+ "grad_norm": 3.81192684173584,
274
+ "learning_rate": 1.705607476635514e-05,
275
+ "loss": 0.3019,
276
+ "step": 330
277
+ },
278
+ {
279
+ "epoch": 4.963503649635037,
280
+ "grad_norm": 3.5110998153686523,
281
+ "learning_rate": 1.588785046728972e-05,
282
+ "loss": 0.2976,
283
+ "step": 340
284
+ },
285
+ {
286
+ "epoch": 4.992700729927007,
287
+ "eval_accuracy": 0.8837955535182214,
288
+ "eval_loss": 0.30171430110931396,
289
+ "eval_runtime": 35.5004,
290
+ "eval_samples_per_second": 122.9,
291
+ "eval_steps_per_second": 1.944,
292
+ "step": 342
293
+ },
294
+ {
295
+ "epoch": 5.109489051094891,
296
+ "grad_norm": 6.99758768081665,
297
+ "learning_rate": 1.4719626168224299e-05,
298
+ "loss": 0.259,
299
+ "step": 350
300
+ },
301
+ {
302
+ "epoch": 5.255474452554744,
303
+ "grad_norm": 4.643028736114502,
304
+ "learning_rate": 1.3551401869158877e-05,
305
+ "loss": 0.2668,
306
+ "step": 360
307
+ },
308
+ {
309
+ "epoch": 5.401459854014599,
310
+ "grad_norm": 3.8736965656280518,
311
+ "learning_rate": 1.2383177570093459e-05,
312
+ "loss": 0.278,
313
+ "step": 370
314
+ },
315
+ {
316
+ "epoch": 5.547445255474453,
317
+ "grad_norm": 5.259199142456055,
318
+ "learning_rate": 1.1214953271028037e-05,
319
+ "loss": 0.2677,
320
+ "step": 380
321
+ },
322
+ {
323
+ "epoch": 5.693430656934306,
324
+ "grad_norm": 3.9390275478363037,
325
+ "learning_rate": 1.0046728971962617e-05,
326
+ "loss": 0.2664,
327
+ "step": 390
328
+ },
329
+ {
330
+ "epoch": 5.839416058394161,
331
+ "grad_norm": 4.5700507164001465,
332
+ "learning_rate": 8.878504672897196e-06,
333
+ "loss": 0.2745,
334
+ "step": 400
335
+ },
336
+ {
337
+ "epoch": 5.985401459854015,
338
+ "grad_norm": 3.543813705444336,
339
+ "learning_rate": 7.710280373831776e-06,
340
+ "loss": 0.2611,
341
+ "step": 410
342
+ },
343
+ {
344
+ "epoch": 6.0,
345
+ "eval_accuracy": 0.8810451524180609,
346
+ "eval_loss": 0.3118920624256134,
347
+ "eval_runtime": 35.1336,
348
+ "eval_samples_per_second": 124.183,
349
+ "eval_steps_per_second": 1.964,
350
+ "step": 411
351
+ },
352
+ {
353
+ "epoch": 6.131386861313868,
354
+ "grad_norm": 4.951327800750732,
355
+ "learning_rate": 6.542056074766355e-06,
356
+ "loss": 0.2515,
357
+ "step": 420
358
+ },
359
+ {
360
+ "epoch": 6.2773722627737225,
361
+ "grad_norm": 9.216889381408691,
362
+ "learning_rate": 5.373831775700935e-06,
363
+ "loss": 0.2588,
364
+ "step": 430
365
+ },
366
+ {
367
+ "epoch": 6.423357664233577,
368
+ "grad_norm": 4.5815606117248535,
369
+ "learning_rate": 4.205607476635514e-06,
370
+ "loss": 0.2531,
371
+ "step": 440
372
+ },
373
+ {
374
+ "epoch": 6.569343065693431,
375
+ "grad_norm": 2.8593881130218506,
376
+ "learning_rate": 3.0373831775700936e-06,
377
+ "loss": 0.2453,
378
+ "step": 450
379
+ },
380
+ {
381
+ "epoch": 6.7153284671532845,
382
+ "grad_norm": 5.8815598487854,
383
+ "learning_rate": 1.8691588785046728e-06,
384
+ "loss": 0.2746,
385
+ "step": 460
386
+ },
387
+ {
388
+ "epoch": 6.861313868613139,
389
+ "grad_norm": 7.535807132720947,
390
+ "learning_rate": 7.009345794392523e-07,
391
+ "loss": 0.255,
392
+ "step": 470
393
+ },
394
+ {
395
+ "epoch": 6.948905109489051,
396
+ "eval_accuracy": 0.8819619527847811,
397
+ "eval_loss": 0.3084806203842163,
398
+ "eval_runtime": 35.4691,
399
+ "eval_samples_per_second": 123.008,
400
+ "eval_steps_per_second": 1.945,
401
+ "step": 476
402
+ },
403
+ {
404
+ "epoch": 6.948905109489051,
405
+ "step": 476,
406
+ "total_flos": 9.517373864500433e+18,
407
+ "train_loss": 0.3870567884765753,
408
+ "train_runtime": 2171.3346,
409
+ "train_samples_per_second": 56.33,
410
+ "train_steps_per_second": 0.219
411
+ }
412
+ ],
413
+ "logging_steps": 10,
414
+ "max_steps": 476,
415
+ "num_input_tokens_seen": 0,
416
+ "num_train_epochs": 7,
417
+ "save_steps": 500,
418
+ "stateful_callbacks": {
419
+ "TrainerControl": {
420
+ "args": {
421
+ "should_epoch_stop": false,
422
+ "should_evaluate": false,
423
+ "should_log": false,
424
+ "should_save": true,
425
+ "should_training_stop": true
426
+ },
427
+ "attributes": {}
428
+ }
429
+ },
430
+ "total_flos": 9.517373864500433e+18,
431
+ "train_batch_size": 64,
432
+ "trial_name": null,
433
+ "trial_params": null
434
+ }