Augusto777 committed on
Commit
3998b2a
1 Parent(s): 748fbc6

End of training

Browse files
README.md CHANGED
@@ -17,8 +17,8 @@ should probably proofread and complete it, then remove this comment. -->
17
 
18
  This model is a fine-tuned version of [microsoft/swin-tiny-patch4-window7-224](https://huggingface.co/microsoft/swin-tiny-patch4-window7-224) on an unknown dataset.
19
  It achieves the following results on the evaluation set:
20
- - Loss: 0.3035
21
- - Accuracy: 0.8793
22
 
23
  ## Model description
24
 
 
17
 
18
  This model is a fine-tuned version of [microsoft/swin-tiny-patch4-window7-224](https://huggingface.co/microsoft/swin-tiny-patch4-window7-224) on an unknown dataset.
19
  It achieves the following results on the evaluation set:
20
+ - Loss: 0.3718
21
+ - Accuracy: 0.8966
22
 
23
  ## Model description
24
 
all_results.json ADDED
@@ -0,0 +1,13 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "epoch": 37.65,
3
+ "eval_accuracy": 0.896551724137931,
4
+ "eval_loss": 0.3717654049396515,
5
+ "eval_runtime": 0.6072,
6
+ "eval_samples_per_second": 95.521,
7
+ "eval_steps_per_second": 3.294,
8
+ "total_flos": 4.870057509170381e+17,
9
+ "train_loss": 0.5200165078043938,
10
+ "train_runtime": 456.0431,
11
+ "train_samples_per_second": 45.61,
12
+ "train_steps_per_second": 0.351
13
+ }
eval_results.json ADDED
@@ -0,0 +1,8 @@
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "epoch": 37.65,
3
+ "eval_accuracy": 0.896551724137931,
4
+ "eval_loss": 0.3717654049396515,
5
+ "eval_runtime": 0.6072,
6
+ "eval_samples_per_second": 95.521,
7
+ "eval_steps_per_second": 3.294
8
+ }
runs/Dec05_23-14-42_2e18f523b17c/events.out.tfevents.1701818581.2e18f523b17c.3067.1 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:33793eb5623af834896cf2a2d62087852de48c71ca53564b07fd56aa1ab2a832
3
+ size 411
train_results.json ADDED
@@ -0,0 +1,8 @@
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "epoch": 37.65,
3
+ "total_flos": 4.870057509170381e+17,
4
+ "train_loss": 0.5200165078043938,
5
+ "train_runtime": 456.0431,
6
+ "train_samples_per_second": 45.61,
7
+ "train_steps_per_second": 0.351
8
+ }
trainer_state.json ADDED
@@ -0,0 +1,466 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "best_metric": 0.896551724137931,
3
+ "best_model_checkpoint": "swin-tiny-patch4-window7-224-dmae-va-da2-40/checkpoint-110",
4
+ "epoch": 37.64705882352941,
5
+ "eval_steps": 500,
6
+ "global_step": 160,
7
+ "is_hyper_param_search": false,
8
+ "is_local_process_zero": true,
9
+ "is_world_process_zero": true,
10
+ "log_history": [
11
+ {
12
+ "epoch": 0.94,
13
+ "eval_accuracy": 0.3620689655172414,
14
+ "eval_loss": 1.3102844953536987,
15
+ "eval_runtime": 0.5859,
16
+ "eval_samples_per_second": 99.0,
17
+ "eval_steps_per_second": 3.414,
18
+ "step": 4
19
+ },
20
+ {
21
+ "epoch": 1.88,
22
+ "eval_accuracy": 0.3275862068965517,
23
+ "eval_loss": 1.2844481468200684,
24
+ "eval_runtime": 0.541,
25
+ "eval_samples_per_second": 107.217,
26
+ "eval_steps_per_second": 3.697,
27
+ "step": 8
28
+ },
29
+ {
30
+ "epoch": 2.35,
31
+ "learning_rate": 3.125e-05,
32
+ "loss": 1.3144,
33
+ "step": 10
34
+ },
35
+ {
36
+ "epoch": 2.82,
37
+ "eval_accuracy": 0.41379310344827586,
38
+ "eval_loss": 1.2574777603149414,
39
+ "eval_runtime": 0.5361,
40
+ "eval_samples_per_second": 108.186,
41
+ "eval_steps_per_second": 3.731,
42
+ "step": 12
43
+ },
44
+ {
45
+ "epoch": 4.0,
46
+ "eval_accuracy": 0.5,
47
+ "eval_loss": 1.1180709600448608,
48
+ "eval_runtime": 0.5531,
49
+ "eval_samples_per_second": 104.867,
50
+ "eval_steps_per_second": 3.616,
51
+ "step": 17
52
+ },
53
+ {
54
+ "epoch": 4.71,
55
+ "learning_rate": 4.8611111111111115e-05,
56
+ "loss": 1.1723,
57
+ "step": 20
58
+ },
59
+ {
60
+ "epoch": 4.94,
61
+ "eval_accuracy": 0.5344827586206896,
62
+ "eval_loss": 1.0054141283035278,
63
+ "eval_runtime": 0.7262,
64
+ "eval_samples_per_second": 79.866,
65
+ "eval_steps_per_second": 2.754,
66
+ "step": 21
67
+ },
68
+ {
69
+ "epoch": 5.88,
70
+ "eval_accuracy": 0.5689655172413793,
71
+ "eval_loss": 0.8771402835845947,
72
+ "eval_runtime": 0.632,
73
+ "eval_samples_per_second": 91.766,
74
+ "eval_steps_per_second": 3.164,
75
+ "step": 25
76
+ },
77
+ {
78
+ "epoch": 6.82,
79
+ "eval_accuracy": 0.7068965517241379,
80
+ "eval_loss": 0.794106125831604,
81
+ "eval_runtime": 0.5449,
82
+ "eval_samples_per_second": 106.436,
83
+ "eval_steps_per_second": 3.67,
84
+ "step": 29
85
+ },
86
+ {
87
+ "epoch": 7.06,
88
+ "learning_rate": 4.5138888888888894e-05,
89
+ "loss": 0.9243,
90
+ "step": 30
91
+ },
92
+ {
93
+ "epoch": 8.0,
94
+ "eval_accuracy": 0.6724137931034483,
95
+ "eval_loss": 0.7037971615791321,
96
+ "eval_runtime": 0.5421,
97
+ "eval_samples_per_second": 106.985,
98
+ "eval_steps_per_second": 3.689,
99
+ "step": 34
100
+ },
101
+ {
102
+ "epoch": 8.94,
103
+ "eval_accuracy": 0.7241379310344828,
104
+ "eval_loss": 0.7341203093528748,
105
+ "eval_runtime": 0.5497,
106
+ "eval_samples_per_second": 105.515,
107
+ "eval_steps_per_second": 3.638,
108
+ "step": 38
109
+ },
110
+ {
111
+ "epoch": 9.41,
112
+ "learning_rate": 4.166666666666667e-05,
113
+ "loss": 0.7394,
114
+ "step": 40
115
+ },
116
+ {
117
+ "epoch": 9.88,
118
+ "eval_accuracy": 0.7413793103448276,
119
+ "eval_loss": 0.6256024837493896,
120
+ "eval_runtime": 0.544,
121
+ "eval_samples_per_second": 106.617,
122
+ "eval_steps_per_second": 3.676,
123
+ "step": 42
124
+ },
125
+ {
126
+ "epoch": 10.82,
127
+ "eval_accuracy": 0.7586206896551724,
128
+ "eval_loss": 0.6058707237243652,
129
+ "eval_runtime": 0.6912,
130
+ "eval_samples_per_second": 83.916,
131
+ "eval_steps_per_second": 2.894,
132
+ "step": 46
133
+ },
134
+ {
135
+ "epoch": 11.76,
136
+ "learning_rate": 3.8194444444444444e-05,
137
+ "loss": 0.627,
138
+ "step": 50
139
+ },
140
+ {
141
+ "epoch": 12.0,
142
+ "eval_accuracy": 0.7413793103448276,
143
+ "eval_loss": 0.5662473440170288,
144
+ "eval_runtime": 0.7222,
145
+ "eval_samples_per_second": 80.313,
146
+ "eval_steps_per_second": 2.769,
147
+ "step": 51
148
+ },
149
+ {
150
+ "epoch": 12.94,
151
+ "eval_accuracy": 0.7931034482758621,
152
+ "eval_loss": 0.5383967757225037,
153
+ "eval_runtime": 0.5429,
154
+ "eval_samples_per_second": 106.842,
155
+ "eval_steps_per_second": 3.684,
156
+ "step": 55
157
+ },
158
+ {
159
+ "epoch": 13.88,
160
+ "eval_accuracy": 0.7758620689655172,
161
+ "eval_loss": 0.5630860328674316,
162
+ "eval_runtime": 0.5402,
163
+ "eval_samples_per_second": 107.371,
164
+ "eval_steps_per_second": 3.702,
165
+ "step": 59
166
+ },
167
+ {
168
+ "epoch": 14.12,
169
+ "learning_rate": 3.472222222222222e-05,
170
+ "loss": 0.5026,
171
+ "step": 60
172
+ },
173
+ {
174
+ "epoch": 14.82,
175
+ "eval_accuracy": 0.8103448275862069,
176
+ "eval_loss": 0.49379998445510864,
177
+ "eval_runtime": 0.5445,
178
+ "eval_samples_per_second": 106.521,
179
+ "eval_steps_per_second": 3.673,
180
+ "step": 63
181
+ },
182
+ {
183
+ "epoch": 16.0,
184
+ "eval_accuracy": 0.8448275862068966,
185
+ "eval_loss": 0.4768355190753937,
186
+ "eval_runtime": 0.5424,
187
+ "eval_samples_per_second": 106.928,
188
+ "eval_steps_per_second": 3.687,
189
+ "step": 68
190
+ },
191
+ {
192
+ "epoch": 16.47,
193
+ "learning_rate": 3.125e-05,
194
+ "loss": 0.4284,
195
+ "step": 70
196
+ },
197
+ {
198
+ "epoch": 16.94,
199
+ "eval_accuracy": 0.8620689655172413,
200
+ "eval_loss": 0.4082733988761902,
201
+ "eval_runtime": 0.5537,
202
+ "eval_samples_per_second": 104.745,
203
+ "eval_steps_per_second": 3.612,
204
+ "step": 72
205
+ },
206
+ {
207
+ "epoch": 17.88,
208
+ "eval_accuracy": 0.8275862068965517,
209
+ "eval_loss": 0.3942280411720276,
210
+ "eval_runtime": 0.5427,
211
+ "eval_samples_per_second": 106.871,
212
+ "eval_steps_per_second": 3.685,
213
+ "step": 76
214
+ },
215
+ {
216
+ "epoch": 18.82,
217
+ "learning_rate": 2.777777777777778e-05,
218
+ "loss": 0.3922,
219
+ "step": 80
220
+ },
221
+ {
222
+ "epoch": 18.82,
223
+ "eval_accuracy": 0.8620689655172413,
224
+ "eval_loss": 0.37597107887268066,
225
+ "eval_runtime": 0.6952,
226
+ "eval_samples_per_second": 83.423,
227
+ "eval_steps_per_second": 2.877,
228
+ "step": 80
229
+ },
230
+ {
231
+ "epoch": 20.0,
232
+ "eval_accuracy": 0.8275862068965517,
233
+ "eval_loss": 0.4109302759170532,
234
+ "eval_runtime": 0.548,
235
+ "eval_samples_per_second": 105.841,
236
+ "eval_steps_per_second": 3.65,
237
+ "step": 85
238
+ },
239
+ {
240
+ "epoch": 20.94,
241
+ "eval_accuracy": 0.8620689655172413,
242
+ "eval_loss": 0.38523542881011963,
243
+ "eval_runtime": 0.5465,
244
+ "eval_samples_per_second": 106.125,
245
+ "eval_steps_per_second": 3.659,
246
+ "step": 89
247
+ },
248
+ {
249
+ "epoch": 21.18,
250
+ "learning_rate": 2.4305555555555558e-05,
251
+ "loss": 0.3927,
252
+ "step": 90
253
+ },
254
+ {
255
+ "epoch": 21.88,
256
+ "eval_accuracy": 0.8620689655172413,
257
+ "eval_loss": 0.3660654127597809,
258
+ "eval_runtime": 0.5512,
259
+ "eval_samples_per_second": 105.229,
260
+ "eval_steps_per_second": 3.629,
261
+ "step": 93
262
+ },
263
+ {
264
+ "epoch": 22.82,
265
+ "eval_accuracy": 0.8793103448275862,
266
+ "eval_loss": 0.3930301368236542,
267
+ "eval_runtime": 0.5482,
268
+ "eval_samples_per_second": 105.792,
269
+ "eval_steps_per_second": 3.648,
270
+ "step": 97
271
+ },
272
+ {
273
+ "epoch": 23.53,
274
+ "learning_rate": 2.0833333333333336e-05,
275
+ "loss": 0.3338,
276
+ "step": 100
277
+ },
278
+ {
279
+ "epoch": 24.0,
280
+ "eval_accuracy": 0.8620689655172413,
281
+ "eval_loss": 0.35855162143707275,
282
+ "eval_runtime": 0.5507,
283
+ "eval_samples_per_second": 105.323,
284
+ "eval_steps_per_second": 3.632,
285
+ "step": 102
286
+ },
287
+ {
288
+ "epoch": 24.94,
289
+ "eval_accuracy": 0.8620689655172413,
290
+ "eval_loss": 0.36067575216293335,
291
+ "eval_runtime": 0.7414,
292
+ "eval_samples_per_second": 78.233,
293
+ "eval_steps_per_second": 2.698,
294
+ "step": 106
295
+ },
296
+ {
297
+ "epoch": 25.88,
298
+ "learning_rate": 1.736111111111111e-05,
299
+ "loss": 0.2698,
300
+ "step": 110
301
+ },
302
+ {
303
+ "epoch": 25.88,
304
+ "eval_accuracy": 0.896551724137931,
305
+ "eval_loss": 0.3717654049396515,
306
+ "eval_runtime": 0.619,
307
+ "eval_samples_per_second": 93.702,
308
+ "eval_steps_per_second": 3.231,
309
+ "step": 110
310
+ },
311
+ {
312
+ "epoch": 26.82,
313
+ "eval_accuracy": 0.8793103448275862,
314
+ "eval_loss": 0.35024696588516235,
315
+ "eval_runtime": 0.5475,
316
+ "eval_samples_per_second": 105.944,
317
+ "eval_steps_per_second": 3.653,
318
+ "step": 114
319
+ },
320
+ {
321
+ "epoch": 28.0,
322
+ "eval_accuracy": 0.8448275862068966,
323
+ "eval_loss": 0.3614311218261719,
324
+ "eval_runtime": 0.5691,
325
+ "eval_samples_per_second": 101.924,
326
+ "eval_steps_per_second": 3.515,
327
+ "step": 119
328
+ },
329
+ {
330
+ "epoch": 28.24,
331
+ "learning_rate": 1.388888888888889e-05,
332
+ "loss": 0.2707,
333
+ "step": 120
334
+ },
335
+ {
336
+ "epoch": 28.94,
337
+ "eval_accuracy": 0.8620689655172413,
338
+ "eval_loss": 0.3537382185459137,
339
+ "eval_runtime": 0.5442,
340
+ "eval_samples_per_second": 106.586,
341
+ "eval_steps_per_second": 3.675,
342
+ "step": 123
343
+ },
344
+ {
345
+ "epoch": 29.88,
346
+ "eval_accuracy": 0.8793103448275862,
347
+ "eval_loss": 0.354471892118454,
348
+ "eval_runtime": 0.5491,
349
+ "eval_samples_per_second": 105.623,
350
+ "eval_steps_per_second": 3.642,
351
+ "step": 127
352
+ },
353
+ {
354
+ "epoch": 30.59,
355
+ "learning_rate": 1.0416666666666668e-05,
356
+ "loss": 0.2622,
357
+ "step": 130
358
+ },
359
+ {
360
+ "epoch": 30.82,
361
+ "eval_accuracy": 0.8793103448275862,
362
+ "eval_loss": 0.32017067074775696,
363
+ "eval_runtime": 0.6084,
364
+ "eval_samples_per_second": 95.331,
365
+ "eval_steps_per_second": 3.287,
366
+ "step": 131
367
+ },
368
+ {
369
+ "epoch": 32.0,
370
+ "eval_accuracy": 0.8793103448275862,
371
+ "eval_loss": 0.3125433623790741,
372
+ "eval_runtime": 0.6933,
373
+ "eval_samples_per_second": 83.663,
374
+ "eval_steps_per_second": 2.885,
375
+ "step": 136
376
+ },
377
+ {
378
+ "epoch": 32.94,
379
+ "learning_rate": 6.944444444444445e-06,
380
+ "loss": 0.2499,
381
+ "step": 140
382
+ },
383
+ {
384
+ "epoch": 32.94,
385
+ "eval_accuracy": 0.8620689655172413,
386
+ "eval_loss": 0.3215100169181824,
387
+ "eval_runtime": 0.5383,
388
+ "eval_samples_per_second": 107.744,
389
+ "eval_steps_per_second": 3.715,
390
+ "step": 140
391
+ },
392
+ {
393
+ "epoch": 33.88,
394
+ "eval_accuracy": 0.8620689655172413,
395
+ "eval_loss": 0.3194180428981781,
396
+ "eval_runtime": 0.5395,
397
+ "eval_samples_per_second": 107.502,
398
+ "eval_steps_per_second": 3.707,
399
+ "step": 144
400
+ },
401
+ {
402
+ "epoch": 34.82,
403
+ "eval_accuracy": 0.8793103448275862,
404
+ "eval_loss": 0.3065814971923828,
405
+ "eval_runtime": 0.5319,
406
+ "eval_samples_per_second": 109.036,
407
+ "eval_steps_per_second": 3.76,
408
+ "step": 148
409
+ },
410
+ {
411
+ "epoch": 35.29,
412
+ "learning_rate": 3.4722222222222224e-06,
413
+ "loss": 0.2157,
414
+ "step": 150
415
+ },
416
+ {
417
+ "epoch": 36.0,
418
+ "eval_accuracy": 0.8793103448275862,
419
+ "eval_loss": 0.3023557662963867,
420
+ "eval_runtime": 0.5521,
421
+ "eval_samples_per_second": 105.047,
422
+ "eval_steps_per_second": 3.622,
423
+ "step": 153
424
+ },
425
+ {
426
+ "epoch": 36.94,
427
+ "eval_accuracy": 0.8793103448275862,
428
+ "eval_loss": 0.30368945002555847,
429
+ "eval_runtime": 0.5271,
430
+ "eval_samples_per_second": 110.045,
431
+ "eval_steps_per_second": 3.795,
432
+ "step": 157
433
+ },
434
+ {
435
+ "epoch": 37.65,
436
+ "learning_rate": 0.0,
437
+ "loss": 0.2248,
438
+ "step": 160
439
+ },
440
+ {
441
+ "epoch": 37.65,
442
+ "eval_accuracy": 0.8793103448275862,
443
+ "eval_loss": 0.303451269865036,
444
+ "eval_runtime": 0.5525,
445
+ "eval_samples_per_second": 104.979,
446
+ "eval_steps_per_second": 3.62,
447
+ "step": 160
448
+ },
449
+ {
450
+ "epoch": 37.65,
451
+ "step": 160,
452
+ "total_flos": 4.870057509170381e+17,
453
+ "train_loss": 0.5200165078043938,
454
+ "train_runtime": 456.0431,
455
+ "train_samples_per_second": 45.61,
456
+ "train_steps_per_second": 0.351
457
+ }
458
+ ],
459
+ "logging_steps": 10,
460
+ "max_steps": 160,
461
+ "num_train_epochs": 40,
462
+ "save_steps": 500,
463
+ "total_flos": 4.870057509170381e+17,
464
+ "trial_name": null,
465
+ "trial_params": null
466
+ }