ZivKassnerNK committed on
Commit
32d2344
·
1 Parent(s): 043ae68

Add evaluation results and output files to model card

Browse files
README.md CHANGED
@@ -5,16 +5,19 @@ tags:
5
  - model
6
  - evaluation
7
  metrics:
8
- - average_precision: 0.98
9
- - roc_auc: 0.98
 
10
  ---
11
 
12
  # Binary Classification Model
13
 
14
  ## Evaluation Results
15
 
16
- **Average Precision:** 0.98
17
- **ROC AUC:** 0.98
 
 
18
 
19
  ## Visualizations
20
 
 
5
  - model
6
  - evaluation
7
  metrics:
8
+ - average_precision: 0.69
9
+ - roc_auc: 0.80
10
+ - best threshold according to F1: 0.49
11
  ---
12
 
13
  # Binary Classification Model
14
 
15
  ## Evaluation Results
16
 
17
+ **Average Precision:** 0.69
18
+ **ROC AUC:** 0.80
19
+ **Best threshold according to F1:** 0.49
20
+
21
 
22
  ## Visualizations
23
 
checkpoint-60/config.json ADDED
@@ -0,0 +1,23 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_name_or_path": "ZivKassnerNK/binary_classification_model_v3.1.3_spines",
3
+ "architectures": [
4
+ "ViTForImageClassification"
5
+ ],
6
+ "attention_probs_dropout_prob": 0.0,
7
+ "encoder_stride": 16,
8
+ "hidden_act": "gelu",
9
+ "hidden_dropout_prob": 0.0,
10
+ "hidden_size": 256,
11
+ "image_size": 32,
12
+ "initializer_range": 0.02,
13
+ "intermediate_size": 512,
14
+ "layer_norm_eps": 1e-12,
15
+ "model_type": "vit",
16
+ "num_attention_heads": 8,
17
+ "num_channels": 3,
18
+ "num_hidden_layers": 4,
19
+ "patch_size": 4,
20
+ "qkv_bias": true,
21
+ "torch_dtype": "float32",
22
+ "transformers_version": "4.46.2"
23
+ }
checkpoint-60/model.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:15c3e4eadac387d483c826c1b623a2d3556ddc29b917fb4af6ac56d20f6bc19a
3
+ size 8563512
checkpoint-60/optimizer.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:199a160bf7c2384f9978abcd0839d2e41a02de869543a5cf1b9e930265ba8cba
3
+ size 17153530
checkpoint-60/preprocessor_config.json ADDED
@@ -0,0 +1,22 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "do_normalize": true,
3
+ "do_rescale": true,
4
+ "do_resize": false,
5
+ "image_mean": [
6
+ 0.5,
7
+ 0.5,
8
+ 0.5
9
+ ],
10
+ "image_processor_type": "ViTFeatureExtractor",
11
+ "image_std": [
12
+ 0.5,
13
+ 0.5,
14
+ 0.5
15
+ ],
16
+ "resample": 2,
17
+ "rescale_factor": 0.00392156862745098,
18
+ "size": {
19
+ "height": 32,
20
+ "width": 32
21
+ }
22
+ }
checkpoint-60/rng_state.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7083fc19c48bbb45c07abf88c54fd55da4575c8de4143ad56fb803aa19e03e1c
3
+ size 14244
checkpoint-60/scheduler.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fe62f9b4684e8fb0c29de8f793bdd1b8fa855b987b0ead0080529f92de69f770
3
+ size 1000
checkpoint-60/trainer_state.json ADDED
@@ -0,0 +1,633 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "best_metric": 0.8018098205014093,
3
+ "best_model_checkpoint": "/tmp/logs/binary_classification_model_v3.1.3_spines/checkpoint-60",
4
+ "epoch": 15.0,
5
+ "eval_steps": 500,
6
+ "global_step": 60,
7
+ "is_hyper_param_search": false,
8
+ "is_local_process_zero": true,
9
+ "is_world_process_zero": true,
10
+ "log_history": [
11
+ {
12
+ "epoch": 0.25,
13
+ "grad_norm": 274159.65625,
14
+ "learning_rate": 1.605445671718469e-07,
15
+ "loss": 0.4196,
16
+ "step": 1
17
+ },
18
+ {
19
+ "epoch": 0.5,
20
+ "grad_norm": 123727.359375,
21
+ "learning_rate": 3.210891343436938e-07,
22
+ "loss": 0.4092,
23
+ "step": 2
24
+ },
25
+ {
26
+ "epoch": 0.75,
27
+ "grad_norm": 222667.140625,
28
+ "learning_rate": 4.816337015155407e-07,
29
+ "loss": 0.4168,
30
+ "step": 3
31
+ },
32
+ {
33
+ "epoch": 1.0,
34
+ "grad_norm": 209992.453125,
35
+ "learning_rate": 6.421782686873876e-07,
36
+ "loss": 0.4225,
37
+ "step": 4
38
+ },
39
+ {
40
+ "epoch": 1.0,
41
+ "eval_accuracy": 0.7976561341047322,
42
+ "eval_f1": 0.7792165749433474,
43
+ "eval_loss": 0.41963040828704834,
44
+ "eval_precision": 0.795702479338843,
45
+ "eval_recall": 0.7633999365683476,
46
+ "eval_runtime": 3.391,
47
+ "eval_samples_per_second": 1987.931,
48
+ "eval_steps_per_second": 1.18,
49
+ "step": 4
50
+ },
51
+ {
52
+ "epoch": 1.25,
53
+ "grad_norm": 109456.3203125,
54
+ "learning_rate": 8.027228358592346e-07,
55
+ "loss": 0.4175,
56
+ "step": 5
57
+ },
58
+ {
59
+ "epoch": 1.5,
60
+ "grad_norm": 263527.1875,
61
+ "learning_rate": 9.632674030310814e-07,
62
+ "loss": 0.4227,
63
+ "step": 6
64
+ },
65
+ {
66
+ "epoch": 1.75,
67
+ "grad_norm": 201531.734375,
68
+ "learning_rate": 1.1238119702029283e-06,
69
+ "loss": 0.4214,
70
+ "step": 7
71
+ },
72
+ {
73
+ "epoch": 2.0,
74
+ "grad_norm": 185288.390625,
75
+ "learning_rate": 1.2843565373747752e-06,
76
+ "loss": 0.4262,
77
+ "step": 8
78
+ },
79
+ {
80
+ "epoch": 2.0,
81
+ "eval_accuracy": 0.7937991395935321,
82
+ "eval_f1": 0.7719067935674434,
83
+ "eval_loss": 0.4199751019477844,
84
+ "eval_precision": 0.7997279836790208,
85
+ "eval_recall": 0.7459562321598477,
86
+ "eval_runtime": 3.5857,
87
+ "eval_samples_per_second": 1879.992,
88
+ "eval_steps_per_second": 1.116,
89
+ "step": 8
90
+ },
91
+ {
92
+ "epoch": 2.25,
93
+ "grad_norm": 155418.6875,
94
+ "learning_rate": 1.444901104546622e-06,
95
+ "loss": 0.4239,
96
+ "step": 9
97
+ },
98
+ {
99
+ "epoch": 2.5,
100
+ "grad_norm": 57884.13671875,
101
+ "learning_rate": 1.6054456717184691e-06,
102
+ "loss": 0.4192,
103
+ "step": 10
104
+ },
105
+ {
106
+ "epoch": 2.75,
107
+ "grad_norm": 67545.6796875,
108
+ "learning_rate": 1.765990238890316e-06,
109
+ "loss": 0.4241,
110
+ "step": 11
111
+ },
112
+ {
113
+ "epoch": 3.0,
114
+ "grad_norm": 205635.140625,
115
+ "learning_rate": 1.926534806062163e-06,
116
+ "loss": 0.4239,
117
+ "step": 12
118
+ },
119
+ {
120
+ "epoch": 3.0,
121
+ "eval_accuracy": 0.79884290164664,
122
+ "eval_f1": 0.7818532818532818,
123
+ "eval_loss": 0.42012614011764526,
124
+ "eval_precision": 0.7933398628795298,
125
+ "eval_recall": 0.7706945765937203,
126
+ "eval_runtime": 3.6476,
127
+ "eval_samples_per_second": 1848.072,
128
+ "eval_steps_per_second": 1.097,
129
+ "step": 12
130
+ },
131
+ {
132
+ "epoch": 3.25,
133
+ "grad_norm": 330362.96875,
134
+ "learning_rate": 2.0870793732340097e-06,
135
+ "loss": 0.4369,
136
+ "step": 13
137
+ },
138
+ {
139
+ "epoch": 3.5,
140
+ "grad_norm": 340636.6875,
141
+ "learning_rate": 2.2476239404058566e-06,
142
+ "loss": 0.4186,
143
+ "step": 14
144
+ },
145
+ {
146
+ "epoch": 3.75,
147
+ "grad_norm": 224574.828125,
148
+ "learning_rate": 2.408168507577704e-06,
149
+ "loss": 0.4217,
150
+ "step": 15
151
+ },
152
+ {
153
+ "epoch": 4.0,
154
+ "grad_norm": 234618.53125,
155
+ "learning_rate": 2.5687130747495503e-06,
156
+ "loss": 0.397,
157
+ "step": 16
158
+ },
159
+ {
160
+ "epoch": 4.0,
161
+ "eval_accuracy": 0.7969144043910399,
162
+ "eval_f1": 0.7780119993513864,
163
+ "eval_loss": 0.4202006161212921,
164
+ "eval_precision": 0.7959522229595223,
165
+ "eval_recall": 0.7608626704725658,
166
+ "eval_runtime": 3.7223,
167
+ "eval_samples_per_second": 1810.979,
168
+ "eval_steps_per_second": 1.075,
169
+ "step": 16
170
+ },
171
+ {
172
+ "epoch": 4.25,
173
+ "grad_norm": 214805.421875,
174
+ "learning_rate": 2.729257641921397e-06,
175
+ "loss": 0.4257,
176
+ "step": 17
177
+ },
178
+ {
179
+ "epoch": 4.5,
180
+ "grad_norm": 193107.890625,
181
+ "learning_rate": 2.889802209093244e-06,
182
+ "loss": 0.421,
183
+ "step": 18
184
+ },
185
+ {
186
+ "epoch": 4.75,
187
+ "grad_norm": 185903.40625,
188
+ "learning_rate": 3.0503467762650913e-06,
189
+ "loss": 0.4226,
190
+ "step": 19
191
+ },
192
+ {
193
+ "epoch": 5.0,
194
+ "grad_norm": 146775.96875,
195
+ "learning_rate": 3.2108913434369382e-06,
196
+ "loss": 0.4049,
197
+ "step": 20
198
+ },
199
+ {
200
+ "epoch": 5.0,
201
+ "eval_accuracy": 0.7930574098798397,
202
+ "eval_f1": 0.7698399604025739,
203
+ "eval_loss": 0.4199390411376953,
204
+ "eval_precision": 0.8022696011004127,
205
+ "eval_recall": 0.739930225182366,
206
+ "eval_runtime": 3.7358,
207
+ "eval_samples_per_second": 1804.441,
208
+ "eval_steps_per_second": 1.071,
209
+ "step": 20
210
+ },
211
+ {
212
+ "epoch": 5.25,
213
+ "grad_norm": 193645.421875,
214
+ "learning_rate": 3.371435910608785e-06,
215
+ "loss": 0.4233,
216
+ "step": 21
217
+ },
218
+ {
219
+ "epoch": 5.5,
220
+ "grad_norm": 626666.875,
221
+ "learning_rate": 3.531980477780632e-06,
222
+ "loss": 0.421,
223
+ "step": 22
224
+ },
225
+ {
226
+ "epoch": 5.75,
227
+ "grad_norm": 317973.40625,
228
+ "learning_rate": 3.692525044952479e-06,
229
+ "loss": 0.4353,
230
+ "step": 23
231
+ },
232
+ {
233
+ "epoch": 6.0,
234
+ "grad_norm": 185018.9375,
235
+ "learning_rate": 3.853069612124326e-06,
236
+ "loss": 0.413,
237
+ "step": 24
238
+ },
239
+ {
240
+ "epoch": 6.0,
241
+ "eval_accuracy": 0.7991395935321169,
242
+ "eval_f1": 0.7809061488673139,
243
+ "eval_loss": 0.4188691973686218,
244
+ "eval_precision": 0.7971589032044929,
245
+ "eval_recall": 0.7653028861401839,
246
+ "eval_runtime": 3.7978,
247
+ "eval_samples_per_second": 1774.966,
248
+ "eval_steps_per_second": 1.053,
249
+ "step": 24
250
+ },
251
+ {
252
+ "epoch": 6.25,
253
+ "grad_norm": 113566.4609375,
254
+ "learning_rate": 4.0136141792961726e-06,
255
+ "loss": 0.412,
256
+ "step": 25
257
+ },
258
+ {
259
+ "epoch": 6.5,
260
+ "grad_norm": 261597.5625,
261
+ "learning_rate": 4.1741587464680194e-06,
262
+ "loss": 0.4271,
263
+ "step": 26
264
+ },
265
+ {
266
+ "epoch": 6.75,
267
+ "grad_norm": 322553.15625,
268
+ "learning_rate": 4.334703313639866e-06,
269
+ "loss": 0.4138,
270
+ "step": 27
271
+ },
272
+ {
273
+ "epoch": 7.0,
274
+ "grad_norm": 299670.59375,
275
+ "learning_rate": 4.495247880811713e-06,
276
+ "loss": 0.4336,
277
+ "step": 28
278
+ },
279
+ {
280
+ "epoch": 7.0,
281
+ "eval_accuracy": 0.7982495178756861,
282
+ "eval_f1": 0.7792924375202857,
283
+ "eval_loss": 0.4183463454246521,
284
+ "eval_precision": 0.7979395147889664,
285
+ "eval_recall": 0.7614969869965112,
286
+ "eval_runtime": 3.822,
287
+ "eval_samples_per_second": 1763.716,
288
+ "eval_steps_per_second": 1.047,
289
+ "step": 28
290
+ },
291
+ {
292
+ "epoch": 7.25,
293
+ "grad_norm": 129755.515625,
294
+ "learning_rate": 4.655792447983561e-06,
295
+ "loss": 0.4236,
296
+ "step": 29
297
+ },
298
+ {
299
+ "epoch": 7.5,
300
+ "grad_norm": 149775.578125,
301
+ "learning_rate": 4.816337015155408e-06,
302
+ "loss": 0.4221,
303
+ "step": 30
304
+ },
305
+ {
306
+ "epoch": 7.75,
307
+ "grad_norm": 452987.9375,
308
+ "learning_rate": 4.976881582327254e-06,
309
+ "loss": 0.4276,
310
+ "step": 31
311
+ },
312
+ {
313
+ "epoch": 8.0,
314
+ "grad_norm": 406737.96875,
315
+ "learning_rate": 5.137426149499101e-06,
316
+ "loss": 0.408,
317
+ "step": 32
318
+ },
319
+ {
320
+ "epoch": 8.0,
321
+ "eval_accuracy": 0.7954309449636553,
322
+ "eval_f1": 0.7733026467203682,
323
+ "eval_loss": 0.4189365804195404,
324
+ "eval_precision": 0.8027303754266212,
325
+ "eval_recall": 0.7459562321598477,
326
+ "eval_runtime": 4.1779,
327
+ "eval_samples_per_second": 1613.482,
328
+ "eval_steps_per_second": 0.957,
329
+ "step": 32
330
+ },
331
+ {
332
+ "epoch": 8.25,
333
+ "grad_norm": 173327.0625,
334
+ "learning_rate": 5.297970716670948e-06,
335
+ "loss": 0.4021,
336
+ "step": 33
337
+ },
338
+ {
339
+ "epoch": 8.5,
340
+ "grad_norm": 132129.640625,
341
+ "learning_rate": 5.458515283842794e-06,
342
+ "loss": 0.4216,
343
+ "step": 34
344
+ },
345
+ {
346
+ "epoch": 8.75,
347
+ "grad_norm": 328514.625,
348
+ "learning_rate": 5.619059851014642e-06,
349
+ "loss": 0.4214,
350
+ "step": 35
351
+ },
352
+ {
353
+ "epoch": 9.0,
354
+ "grad_norm": 296242.96875,
355
+ "learning_rate": 5.779604418186488e-06,
356
+ "loss": 0.4328,
357
+ "step": 36
358
+ },
359
+ {
360
+ "epoch": 9.0,
361
+ "eval_accuracy": 0.8003263610740247,
362
+ "eval_f1": 0.7828331719909648,
363
+ "eval_loss": 0.4176911413669586,
364
+ "eval_precision": 0.7967159277504106,
365
+ "eval_recall": 0.7694259435458294,
366
+ "eval_runtime": 3.9359,
367
+ "eval_samples_per_second": 1712.676,
368
+ "eval_steps_per_second": 1.016,
369
+ "step": 36
370
+ },
371
+ {
372
+ "epoch": 9.25,
373
+ "grad_norm": 164642.25,
374
+ "learning_rate": 5.940148985358336e-06,
375
+ "loss": 0.4296,
376
+ "step": 37
377
+ },
378
+ {
379
+ "epoch": 9.5,
380
+ "grad_norm": 386216.90625,
381
+ "learning_rate": 6.100693552530183e-06,
382
+ "loss": 0.4082,
383
+ "step": 38
384
+ },
385
+ {
386
+ "epoch": 9.75,
387
+ "grad_norm": 341470.5625,
388
+ "learning_rate": 6.2612381197020296e-06,
389
+ "loss": 0.4235,
390
+ "step": 39
391
+ },
392
+ {
393
+ "epoch": 10.0,
394
+ "grad_norm": 161297.625,
395
+ "learning_rate": 6.4217826868738764e-06,
396
+ "loss": 0.4109,
397
+ "step": 40
398
+ },
399
+ {
400
+ "epoch": 10.0,
401
+ "eval_accuracy": 0.7982495178756861,
402
+ "eval_f1": 0.7789336801040312,
403
+ "eval_loss": 0.41719672083854675,
404
+ "eval_precision": 0.7989329776592198,
405
+ "eval_recall": 0.7599111956866477,
406
+ "eval_runtime": 3.9721,
407
+ "eval_samples_per_second": 1697.089,
408
+ "eval_steps_per_second": 1.007,
409
+ "step": 40
410
+ },
411
+ {
412
+ "epoch": 10.25,
413
+ "grad_norm": 336130.65625,
414
+ "learning_rate": 6.5823272540457225e-06,
415
+ "loss": 0.4119,
416
+ "step": 41
417
+ },
418
+ {
419
+ "epoch": 10.5,
420
+ "grad_norm": 538575.9375,
421
+ "learning_rate": 6.74287182121757e-06,
422
+ "loss": 0.4189,
423
+ "step": 42
424
+ },
425
+ {
426
+ "epoch": 10.75,
427
+ "grad_norm": 566222.0625,
428
+ "learning_rate": 6.903416388389417e-06,
429
+ "loss": 0.4167,
430
+ "step": 43
431
+ },
432
+ {
433
+ "epoch": 11.0,
434
+ "grad_norm": 502448.53125,
435
+ "learning_rate": 7.063960955561264e-06,
436
+ "loss": 0.4242,
437
+ "step": 44
438
+ },
439
+ {
440
+ "epoch": 11.0,
441
+ "eval_accuracy": 0.8006230529595015,
442
+ "eval_f1": 0.785234899328859,
443
+ "eval_loss": 0.41683289408683777,
444
+ "eval_precision": 0.7913043478260869,
445
+ "eval_recall": 0.7792578496669839,
446
+ "eval_runtime": 4.0247,
447
+ "eval_samples_per_second": 1674.916,
448
+ "eval_steps_per_second": 0.994,
449
+ "step": 44
450
+ },
451
+ {
452
+ "epoch": 11.25,
453
+ "grad_norm": 461244.03125,
454
+ "learning_rate": 7.224505522733111e-06,
455
+ "loss": 0.4241,
456
+ "step": 45
457
+ },
458
+ {
459
+ "epoch": 11.5,
460
+ "grad_norm": 354418.75,
461
+ "learning_rate": 7.385050089904958e-06,
462
+ "loss": 0.4113,
463
+ "step": 46
464
+ },
465
+ {
466
+ "epoch": 11.75,
467
+ "grad_norm": 367365.15625,
468
+ "learning_rate": 7.5455946570768045e-06,
469
+ "loss": 0.4066,
470
+ "step": 47
471
+ },
472
+ {
473
+ "epoch": 12.0,
474
+ "grad_norm": 241178.4375,
475
+ "learning_rate": 7.706139224248651e-06,
476
+ "loss": 0.4237,
477
+ "step": 48
478
+ },
479
+ {
480
+ "epoch": 12.0,
481
+ "eval_accuracy": 0.7964693665628245,
482
+ "eval_f1": 0.7763286599282687,
483
+ "eval_loss": 0.41600093245506287,
484
+ "eval_precision": 0.7987252599798725,
485
+ "eval_recall": 0.7551538217570568,
486
+ "eval_runtime": 4.068,
487
+ "eval_samples_per_second": 1657.071,
488
+ "eval_steps_per_second": 0.983,
489
+ "step": 48
490
+ },
491
+ {
492
+ "epoch": 12.25,
493
+ "grad_norm": 236949.75,
494
+ "learning_rate": 7.866683791420498e-06,
495
+ "loss": 0.4187,
496
+ "step": 49
497
+ },
498
+ {
499
+ "epoch": 12.5,
500
+ "grad_norm": 367486.0,
501
+ "learning_rate": 8.027228358592345e-06,
502
+ "loss": 0.4213,
503
+ "step": 50
504
+ },
505
+ {
506
+ "epoch": 12.75,
507
+ "grad_norm": 594396.3125,
508
+ "learning_rate": 8.187772925764192e-06,
509
+ "loss": 0.4117,
510
+ "step": 51
511
+ },
512
+ {
513
+ "epoch": 13.0,
514
+ "grad_norm": 535547.0,
515
+ "learning_rate": 8.348317492936039e-06,
516
+ "loss": 0.4294,
517
+ "step": 52
518
+ },
519
+ {
520
+ "epoch": 13.0,
521
+ "eval_accuracy": 0.8001780151312862,
522
+ "eval_f1": 0.7838921867479545,
523
+ "eval_loss": 0.4154762029647827,
524
+ "eval_precision": 0.7931818181818182,
525
+ "eval_recall": 0.7748176339993657,
526
+ "eval_runtime": 4.1194,
527
+ "eval_samples_per_second": 1636.391,
528
+ "eval_steps_per_second": 0.971,
529
+ "step": 52
530
+ },
531
+ {
532
+ "epoch": 13.25,
533
+ "grad_norm": 192222.078125,
534
+ "learning_rate": 8.508862060107887e-06,
535
+ "loss": 0.4259,
536
+ "step": 53
537
+ },
538
+ {
539
+ "epoch": 13.5,
540
+ "grad_norm": 169889.9375,
541
+ "learning_rate": 8.669406627279733e-06,
542
+ "loss": 0.4129,
543
+ "step": 54
544
+ },
545
+ {
546
+ "epoch": 13.75,
547
+ "grad_norm": 802483.4375,
548
+ "learning_rate": 8.82995119445158e-06,
549
+ "loss": 0.4143,
550
+ "step": 55
551
+ },
552
+ {
553
+ "epoch": 14.0,
554
+ "grad_norm": 1152123.0,
555
+ "learning_rate": 8.990495761623426e-06,
556
+ "loss": 0.4141,
557
+ "step": 56
558
+ },
559
+ {
560
+ "epoch": 14.0,
561
+ "eval_accuracy": 0.7955792909063937,
562
+ "eval_f1": 0.7706391478029294,
563
+ "eval_loss": 0.41698139905929565,
564
+ "eval_precision": 0.8108581436077058,
565
+ "eval_recall": 0.7342213764668569,
566
+ "eval_runtime": 4.1658,
567
+ "eval_samples_per_second": 1618.183,
568
+ "eval_steps_per_second": 0.96,
569
+ "step": 56
570
+ },
571
+ {
572
+ "epoch": 14.25,
573
+ "grad_norm": 431923.5,
574
+ "learning_rate": 9.151040328795273e-06,
575
+ "loss": 0.4048,
576
+ "step": 57
577
+ },
578
+ {
579
+ "epoch": 14.5,
580
+ "grad_norm": 107792.703125,
581
+ "learning_rate": 9.311584895967122e-06,
582
+ "loss": 0.4099,
583
+ "step": 58
584
+ },
585
+ {
586
+ "epoch": 14.75,
587
+ "grad_norm": 361818.65625,
588
+ "learning_rate": 9.472129463138967e-06,
589
+ "loss": 0.4235,
590
+ "step": 59
591
+ },
592
+ {
593
+ "epoch": 15.0,
594
+ "grad_norm": 672806.375,
595
+ "learning_rate": 9.632674030310815e-06,
596
+ "loss": 0.4233,
597
+ "step": 60
598
+ },
599
+ {
600
+ "epoch": 15.0,
601
+ "eval_accuracy": 0.8018098205014093,
602
+ "eval_f1": 0.7872611464968153,
603
+ "eval_loss": 0.41520848870277405,
604
+ "eval_precision": 0.7905340582027502,
605
+ "eval_recall": 0.7840152235965747,
606
+ "eval_runtime": 4.2184,
607
+ "eval_samples_per_second": 1598.016,
608
+ "eval_steps_per_second": 0.948,
609
+ "step": 60
610
+ }
611
+ ],
612
+ "logging_steps": 1,
613
+ "max_steps": 80,
614
+ "num_input_tokens_seen": 0,
615
+ "num_train_epochs": 20,
616
+ "save_steps": 500,
617
+ "stateful_callbacks": {
618
+ "TrainerControl": {
619
+ "args": {
620
+ "should_epoch_stop": false,
621
+ "should_evaluate": false,
622
+ "should_log": false,
623
+ "should_save": true,
624
+ "should_training_stop": false
625
+ },
626
+ "attributes": {}
627
+ }
628
+ },
629
+ "total_flos": 9208628260945920.0,
630
+ "train_batch_size": 2048,
631
+ "trial_name": null,
632
+ "trial_params": null
633
+ }
checkpoint-60/training_args.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a962d081d3ebaf098ba4aae1ae99c3f381953544a4002d54b37e070680980a81
3
+ size 5368
config.json CHANGED
@@ -1,4 +1,5 @@
1
  {
 
2
  "architectures": [
3
  "ViTForImageClassification"
4
  ],
@@ -18,5 +19,5 @@
18
  "patch_size": 4,
19
  "qkv_bias": true,
20
  "torch_dtype": "float32",
21
- "transformers_version": "4.46.1"
22
  }
 
1
  {
2
+ "_name_or_path": "ZivKassnerNK/binary_classification_model_v3.1.3_spines",
3
  "architectures": [
4
  "ViTForImageClassification"
5
  ],
 
19
  "patch_size": 4,
20
  "qkv_bias": true,
21
  "torch_dtype": "float32",
22
+ "transformers_version": "4.46.2"
23
  }
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:d3763285e8dd082d9840123bbe4a55f1faaefe6dabaa87bbe48938bee65866d2
3
  size 8563512
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:92713d053262518988d9a71ee99c08290f4284d2816caca747d6ffa93ff0b342
3
  size 8563512
pr_curve.png CHANGED
roc_curve.png CHANGED
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:df1535d56f69b10dec594d0116a6d77d9220713be79d301e5d938e5c3d7f1940
3
  size 5368
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a962d081d3ebaf098ba4aae1ae99c3f381953544a4002d54b37e070680980a81
3
  size 5368