polejowska commited on
Commit
d3dcda9
1 Parent(s): 722e715

End of training

Browse files
Files changed (4) hide show
  1. all_results.json +11 -11
  2. eval_results.json +6 -6
  3. train_results.json +6 -6
  4. trainer_state.json +218 -71
all_results.json CHANGED
@@ -1,13 +1,13 @@
1
  {
2
- "epoch": 4.98,
3
- "eval_accuracy": 0.9775132275132276,
4
- "eval_loss": 0.09184322506189346,
5
- "eval_runtime": 4.8893,
6
- "eval_samples_per_second": 154.623,
7
- "eval_steps_per_second": 4.909,
8
- "total_flos": 5.346226696020296e+17,
9
- "train_loss": 0.37407838611891775,
10
- "train_runtime": 386.1594,
11
- "train_samples_per_second": 55.935,
12
- "train_steps_per_second": 0.427
13
  }
 
1
  {
2
+ "epoch": 9.98,
3
+ "eval_accuracy": 0.9828042328042328,
4
+ "eval_loss": 0.06841638684272766,
5
+ "eval_runtime": 5.801,
6
+ "eval_samples_per_second": 130.321,
7
+ "eval_steps_per_second": 4.137,
8
+ "total_flos": 1.0716320475504968e+18,
9
+ "train_loss": 0.24182906033414783,
10
+ "train_runtime": 827.7733,
11
+ "train_samples_per_second": 52.188,
12
+ "train_steps_per_second": 0.399
13
  }
eval_results.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
- "epoch": 4.98,
3
- "eval_accuracy": 0.9775132275132276,
4
- "eval_loss": 0.09184322506189346,
5
- "eval_runtime": 4.8893,
6
- "eval_samples_per_second": 154.623,
7
- "eval_steps_per_second": 4.909
8
  }
 
1
  {
2
+ "epoch": 9.98,
3
+ "eval_accuracy": 0.9828042328042328,
4
+ "eval_loss": 0.06841638684272766,
5
+ "eval_runtime": 5.801,
6
+ "eval_samples_per_second": 130.321,
7
+ "eval_steps_per_second": 4.137
8
  }
train_results.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
- "epoch": 4.98,
3
- "total_flos": 5.346226696020296e+17,
4
- "train_loss": 0.37407838611891775,
5
- "train_runtime": 386.1594,
6
- "train_samples_per_second": 55.935,
7
- "train_steps_per_second": 0.427
8
  }
 
1
  {
2
+ "epoch": 9.98,
3
+ "total_flos": 1.0716320475504968e+18,
4
+ "train_loss": 0.24182906033414783,
5
+ "train_runtime": 827.7733,
6
+ "train_samples_per_second": 52.188,
7
+ "train_steps_per_second": 0.399
8
  }
trainer_state.json CHANGED
@@ -1,166 +1,313 @@
1
  {
2
- "best_metric": 0.9775132275132276,
3
- "best_model_checkpoint": "swin-tiny-patch4-window7-224-eurosat/checkpoint-165",
4
- "epoch": 4.977777777777778,
5
- "global_step": 165,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
9
  "log_history": [
10
  {
11
  "epoch": 0.3,
12
- "learning_rate": 2.9411764705882354e-05,
13
- "loss": 2.2557,
14
  "step": 10
15
  },
16
  {
17
  "epoch": 0.59,
18
- "learning_rate": 4.8986486486486486e-05,
19
- "loss": 1.5384,
20
  "step": 20
21
  },
22
  {
23
  "epoch": 0.89,
24
- "learning_rate": 4.560810810810811e-05,
25
- "loss": 0.6233,
26
  "step": 30
27
  },
28
  {
29
  "epoch": 0.98,
30
- "eval_accuracy": 0.91005291005291,
31
- "eval_loss": 0.30006203055381775,
32
- "eval_runtime": 4.7638,
33
- "eval_samples_per_second": 158.696,
34
- "eval_steps_per_second": 5.038,
35
  "step": 33
36
  },
37
  {
38
  "epoch": 1.21,
39
- "learning_rate": 4.222972972972973e-05,
40
- "loss": 0.3829,
41
  "step": 40
42
  },
43
  {
44
  "epoch": 1.5,
45
- "learning_rate": 3.885135135135135e-05,
46
- "loss": 0.2118,
47
  "step": 50
48
  },
49
  {
50
  "epoch": 1.8,
51
- "learning_rate": 3.547297297297297e-05,
52
- "loss": 0.1958,
53
  "step": 60
54
  },
55
  {
56
  "epoch": 1.98,
57
- "eval_accuracy": 0.9642857142857143,
58
- "eval_loss": 0.12865345180034637,
59
- "eval_runtime": 4.9076,
60
- "eval_samples_per_second": 154.047,
61
- "eval_steps_per_second": 4.89,
62
  "step": 66
63
  },
64
  {
65
  "epoch": 2.12,
66
- "learning_rate": 3.20945945945946e-05,
67
- "loss": 0.1691,
68
  "step": 70
69
  },
70
  {
71
  "epoch": 2.41,
72
- "learning_rate": 2.8716216216216217e-05,
73
- "loss": 0.1239,
74
  "step": 80
75
  },
76
  {
77
  "epoch": 2.71,
78
- "learning_rate": 2.533783783783784e-05,
79
- "loss": 0.1212,
80
  "step": 90
81
  },
82
  {
83
  "epoch": 2.98,
84
- "eval_accuracy": 0.9708994708994709,
85
- "eval_loss": 0.11089407652616501,
86
- "eval_runtime": 4.7941,
87
- "eval_samples_per_second": 157.693,
88
- "eval_steps_per_second": 5.006,
89
  "step": 99
90
  },
91
  {
92
  "epoch": 3.03,
93
- "learning_rate": 2.195945945945946e-05,
94
- "loss": 0.1071,
95
  "step": 100
96
  },
97
  {
98
  "epoch": 3.33,
99
- "learning_rate": 1.8581081081081082e-05,
100
- "loss": 0.0814,
101
  "step": 110
102
  },
103
  {
104
  "epoch": 3.62,
105
- "learning_rate": 1.5202702702702704e-05,
106
- "loss": 0.0962,
107
  "step": 120
108
  },
109
  {
110
  "epoch": 3.92,
111
- "learning_rate": 1.1824324324324325e-05,
112
- "loss": 0.0734,
113
  "step": 130
114
  },
115
  {
116
  "epoch": 3.98,
117
- "eval_accuracy": 0.9642857142857143,
118
- "eval_loss": 0.11790694296360016,
119
- "eval_runtime": 4.8978,
120
- "eval_samples_per_second": 154.355,
121
- "eval_steps_per_second": 4.9,
122
  "step": 132
123
  },
124
  {
125
  "epoch": 4.24,
126
- "learning_rate": 8.445945945945946e-06,
127
- "loss": 0.0679,
128
  "step": 140
129
  },
130
  {
131
  "epoch": 4.53,
132
- "learning_rate": 5.067567567567568e-06,
133
- "loss": 0.0516,
134
  "step": 150
135
  },
136
  {
137
  "epoch": 4.83,
138
- "learning_rate": 1.6891891891891894e-06,
139
- "loss": 0.0457,
140
  "step": 160
141
  },
142
  {
143
  "epoch": 4.98,
144
- "eval_accuracy": 0.9775132275132276,
145
- "eval_loss": 0.09184322506189346,
146
- "eval_runtime": 4.7828,
147
- "eval_samples_per_second": 158.066,
148
- "eval_steps_per_second": 5.018,
149
  "step": 165
150
  },
151
  {
152
- "epoch": 4.98,
153
- "step": 165,
154
- "total_flos": 5.346226696020296e+17,
155
- "train_loss": 0.37407838611891775,
156
- "train_runtime": 386.1594,
157
- "train_samples_per_second": 55.935,
158
- "train_steps_per_second": 0.427
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
159
  }
160
  ],
161
- "max_steps": 165,
162
- "num_train_epochs": 5,
163
- "total_flos": 5.346226696020296e+17,
164
  "trial_name": null,
165
  "trial_params": null
166
  }
 
1
  {
2
+ "best_metric": 0.9828042328042328,
3
+ "best_model_checkpoint": "swin-tiny-patch4-window7-224-eurosat/checkpoint-297",
4
+ "epoch": 9.977777777777778,
5
+ "global_step": 330,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
9
  "log_history": [
10
  {
11
  "epoch": 0.3,
12
+ "learning_rate": 1.5151515151515153e-05,
13
+ "loss": 2.3574,
14
  "step": 10
15
  },
16
  {
17
  "epoch": 0.59,
18
+ "learning_rate": 3.0303030303030306e-05,
19
+ "loss": 1.981,
20
  "step": 20
21
  },
22
  {
23
  "epoch": 0.89,
24
+ "learning_rate": 4.545454545454546e-05,
25
+ "loss": 1.2075,
26
  "step": 30
27
  },
28
  {
29
  "epoch": 0.98,
30
+ "eval_accuracy": 0.8518518518518519,
31
+ "eval_loss": 0.5666351914405823,
32
+ "eval_runtime": 4.8236,
33
+ "eval_samples_per_second": 156.731,
34
+ "eval_steps_per_second": 4.976,
35
  "step": 33
36
  },
37
  {
38
  "epoch": 1.21,
39
+ "learning_rate": 4.882154882154882e-05,
40
+ "loss": 0.5066,
41
  "step": 40
42
  },
43
  {
44
  "epoch": 1.5,
45
+ "learning_rate": 4.713804713804714e-05,
46
+ "loss": 0.2643,
47
  "step": 50
48
  },
49
  {
50
  "epoch": 1.8,
51
+ "learning_rate": 4.545454545454546e-05,
52
+ "loss": 0.2022,
53
  "step": 60
54
  },
55
  {
56
  "epoch": 1.98,
57
+ "eval_accuracy": 0.9126984126984127,
58
+ "eval_loss": 0.252269446849823,
59
+ "eval_runtime": 4.9657,
60
+ "eval_samples_per_second": 152.245,
61
+ "eval_steps_per_second": 4.833,
62
  "step": 66
63
  },
64
  {
65
  "epoch": 2.12,
66
+ "learning_rate": 4.3771043771043774e-05,
67
+ "loss": 0.1839,
68
  "step": 70
69
  },
70
  {
71
  "epoch": 2.41,
72
+ "learning_rate": 4.208754208754209e-05,
73
+ "loss": 0.1368,
74
  "step": 80
75
  },
76
  {
77
  "epoch": 2.71,
78
+ "learning_rate": 4.0404040404040405e-05,
79
+ "loss": 0.1206,
80
  "step": 90
81
  },
82
  {
83
  "epoch": 2.98,
84
+ "eval_accuracy": 0.9497354497354498,
85
+ "eval_loss": 0.15757465362548828,
86
+ "eval_runtime": 4.8701,
87
+ "eval_samples_per_second": 155.233,
88
+ "eval_steps_per_second": 4.928,
89
  "step": 99
90
  },
91
  {
92
  "epoch": 3.03,
93
+ "learning_rate": 3.872053872053872e-05,
94
+ "loss": 0.105,
95
  "step": 100
96
  },
97
  {
98
  "epoch": 3.33,
99
+ "learning_rate": 3.7037037037037037e-05,
100
+ "loss": 0.0922,
101
  "step": 110
102
  },
103
  {
104
  "epoch": 3.62,
105
+ "learning_rate": 3.535353535353535e-05,
106
+ "loss": 0.0925,
107
  "step": 120
108
  },
109
  {
110
  "epoch": 3.92,
111
+ "learning_rate": 3.3670033670033675e-05,
112
+ "loss": 0.0897,
113
  "step": 130
114
  },
115
  {
116
  "epoch": 3.98,
117
+ "eval_accuracy": 0.9563492063492064,
118
+ "eval_loss": 0.142096146941185,
119
+ "eval_runtime": 6.3572,
120
+ "eval_samples_per_second": 118.921,
121
+ "eval_steps_per_second": 3.775,
122
  "step": 132
123
  },
124
  {
125
  "epoch": 4.24,
126
+ "learning_rate": 3.198653198653199e-05,
127
+ "loss": 0.0704,
128
  "step": 140
129
  },
130
  {
131
  "epoch": 4.53,
132
+ "learning_rate": 3.0303030303030306e-05,
133
+ "loss": 0.0511,
134
  "step": 150
135
  },
136
  {
137
  "epoch": 4.83,
138
+ "learning_rate": 2.8619528619528618e-05,
139
+ "loss": 0.0564,
140
  "step": 160
141
  },
142
  {
143
  "epoch": 4.98,
144
+ "eval_accuracy": 0.9656084656084656,
145
+ "eval_loss": 0.11138752847909927,
146
+ "eval_runtime": 5.5251,
147
+ "eval_samples_per_second": 136.831,
148
+ "eval_steps_per_second": 4.344,
149
  "step": 165
150
  },
151
  {
152
+ "epoch": 5.15,
153
+ "learning_rate": 2.6936026936026937e-05,
154
+ "loss": 0.0559,
155
+ "step": 170
156
+ },
157
+ {
158
+ "epoch": 5.44,
159
+ "learning_rate": 2.5252525252525256e-05,
160
+ "loss": 0.0468,
161
+ "step": 180
162
+ },
163
+ {
164
+ "epoch": 5.74,
165
+ "learning_rate": 2.356902356902357e-05,
166
+ "loss": 0.0475,
167
+ "step": 190
168
+ },
169
+ {
170
+ "epoch": 5.98,
171
+ "eval_accuracy": 0.9814814814814815,
172
+ "eval_loss": 0.06781856715679169,
173
+ "eval_runtime": 5.3143,
174
+ "eval_samples_per_second": 142.259,
175
+ "eval_steps_per_second": 4.516,
176
+ "step": 198
177
+ },
178
+ {
179
+ "epoch": 6.06,
180
+ "learning_rate": 2.1885521885521887e-05,
181
+ "loss": 0.0514,
182
+ "step": 200
183
+ },
184
+ {
185
+ "epoch": 6.36,
186
+ "learning_rate": 2.0202020202020203e-05,
187
+ "loss": 0.0237,
188
+ "step": 210
189
+ },
190
+ {
191
+ "epoch": 6.65,
192
+ "learning_rate": 1.8518518518518518e-05,
193
+ "loss": 0.0255,
194
+ "step": 220
195
+ },
196
+ {
197
+ "epoch": 6.95,
198
+ "learning_rate": 1.6835016835016837e-05,
199
+ "loss": 0.0332,
200
+ "step": 230
201
+ },
202
+ {
203
+ "epoch": 6.98,
204
+ "eval_accuracy": 0.9775132275132276,
205
+ "eval_loss": 0.08194286376237869,
206
+ "eval_runtime": 5.0836,
207
+ "eval_samples_per_second": 148.714,
208
+ "eval_steps_per_second": 4.721,
209
+ "step": 231
210
+ },
211
+ {
212
+ "epoch": 7.27,
213
+ "learning_rate": 1.5151515151515153e-05,
214
+ "loss": 0.0263,
215
+ "step": 240
216
+ },
217
+ {
218
+ "epoch": 7.56,
219
+ "learning_rate": 1.3468013468013468e-05,
220
+ "loss": 0.0193,
221
+ "step": 250
222
+ },
223
+ {
224
+ "epoch": 7.86,
225
+ "learning_rate": 1.1784511784511786e-05,
226
+ "loss": 0.0234,
227
+ "step": 260
228
+ },
229
+ {
230
+ "epoch": 7.98,
231
+ "eval_accuracy": 0.9801587301587301,
232
+ "eval_loss": 0.06791768968105316,
233
+ "eval_runtime": 5.0567,
234
+ "eval_samples_per_second": 149.505,
235
+ "eval_steps_per_second": 4.746,
236
+ "step": 264
237
+ },
238
+ {
239
+ "epoch": 8.18,
240
+ "learning_rate": 1.0101010101010101e-05,
241
+ "loss": 0.0193,
242
+ "step": 270
243
+ },
244
+ {
245
+ "epoch": 8.47,
246
+ "learning_rate": 8.417508417508419e-06,
247
+ "loss": 0.0151,
248
+ "step": 280
249
+ },
250
+ {
251
+ "epoch": 8.77,
252
+ "learning_rate": 6.734006734006734e-06,
253
+ "loss": 0.0126,
254
+ "step": 290
255
+ },
256
+ {
257
+ "epoch": 8.98,
258
+ "eval_accuracy": 0.9828042328042328,
259
+ "eval_loss": 0.06841638684272766,
260
+ "eval_runtime": 4.8183,
261
+ "eval_samples_per_second": 156.902,
262
+ "eval_steps_per_second": 4.981,
263
+ "step": 297
264
+ },
265
+ {
266
+ "epoch": 9.09,
267
+ "learning_rate": 5.050505050505051e-06,
268
+ "loss": 0.0096,
269
+ "step": 300
270
+ },
271
+ {
272
+ "epoch": 9.39,
273
+ "learning_rate": 3.367003367003367e-06,
274
+ "loss": 0.0091,
275
+ "step": 310
276
+ },
277
+ {
278
+ "epoch": 9.68,
279
+ "learning_rate": 1.6835016835016836e-06,
280
+ "loss": 0.0136,
281
+ "step": 320
282
+ },
283
+ {
284
+ "epoch": 9.98,
285
+ "learning_rate": 0.0,
286
+ "loss": 0.0306,
287
+ "step": 330
288
+ },
289
+ {
290
+ "epoch": 9.98,
291
+ "eval_accuracy": 0.9814814814814815,
292
+ "eval_loss": 0.07185560464859009,
293
+ "eval_runtime": 6.808,
294
+ "eval_samples_per_second": 111.046,
295
+ "eval_steps_per_second": 3.525,
296
+ "step": 330
297
+ },
298
+ {
299
+ "epoch": 9.98,
300
+ "step": 330,
301
+ "total_flos": 1.0716320475504968e+18,
302
+ "train_loss": 0.24182906033414783,
303
+ "train_runtime": 827.7733,
304
+ "train_samples_per_second": 52.188,
305
+ "train_steps_per_second": 0.399
306
  }
307
  ],
308
+ "max_steps": 330,
309
+ "num_train_epochs": 10,
310
+ "total_flos": 1.0716320475504968e+18,
311
  "trial_name": null,
312
  "trial_params": null
313
  }