Samrita committed on
Commit
d1c3bf0
·
1 Parent(s): c6f51f6

Upload folder using huggingface_hub

Browse files
config.json ADDED
@@ -0,0 +1,32 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_name_or_path": "google/vit-base-patch16-224-in21k",
3
+ "architectures": [
4
+ "ViTForImageClassification"
5
+ ],
6
+ "attention_probs_dropout_prob": 0.0,
7
+ "encoder_stride": 16,
8
+ "hidden_act": "gelu",
9
+ "hidden_dropout_prob": 0.0,
10
+ "hidden_size": 768,
11
+ "id2label": {
12
+ "0": "Bird",
13
+ "1": "Not Bird"
14
+ },
15
+ "image_size": 224,
16
+ "initializer_range": 0.02,
17
+ "intermediate_size": 3072,
18
+ "label2id": {
19
+ "Bird": "0",
20
+ "Not Bird": "1"
21
+ },
22
+ "layer_norm_eps": 1e-12,
23
+ "model_type": "vit",
24
+ "num_attention_heads": 12,
25
+ "num_channels": 3,
26
+ "num_hidden_layers": 12,
27
+ "patch_size": 16,
28
+ "problem_type": "single_label_classification",
29
+ "qkv_bias": true,
30
+ "torch_dtype": "float32",
31
+ "transformers_version": "4.30.2"
32
+ }
optimizer.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:91a1cce1f212cb54f0bf321120c3527ba46f22a629bfc43c735c6cd88947f5b0
3
+ size 686518725
preprocessor_config.json ADDED
@@ -0,0 +1,22 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "do_normalize": true,
3
+ "do_rescale": true,
4
+ "do_resize": true,
5
+ "image_mean": [
6
+ 0.5,
7
+ 0.5,
8
+ 0.5
9
+ ],
10
+ "image_processor_type": "ViTFeatureExtractor",
11
+ "image_std": [
12
+ 0.5,
13
+ 0.5,
14
+ 0.5
15
+ ],
16
+ "resample": 2,
17
+ "rescale_factor": 0.00392156862745098,
18
+ "size": {
19
+ "height": 224,
20
+ "width": 224
21
+ }
22
+ }
pytorch_model.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5c4205743262790b190b68005296aaf0a99a4716bf5e6db0367bca997872f80c
3
+ size 343268717
rng_state.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:37436f57ce55af2e38f65a6281769dc0c5f325a8d66d0317c2e21f39e929b2dc
3
+ size 14575
scheduler.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:aa37c7300d657fe4968acd7b02cac1f35b615468d9964d6ae9660eafd9a03b05
3
+ size 627
trainer_state.json ADDED
@@ -0,0 +1,256 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "best_metric": 0.0413714237511158,
3
+ "best_model_checkpoint": "./Birds-Or-Not/checkpoint-225",
4
+ "epoch": 5.813953488372093,
5
+ "global_step": 250,
6
+ "is_hyper_param_search": false,
7
+ "is_local_process_zero": true,
8
+ "is_world_process_zero": true,
9
+ "log_history": [
10
+ {
11
+ "epoch": 0.23,
12
+ "learning_rate": 0.0001922480620155039,
13
+ "loss": 0.512,
14
+ "step": 10
15
+ },
16
+ {
17
+ "epoch": 0.47,
18
+ "learning_rate": 0.00018449612403100774,
19
+ "loss": 0.1901,
20
+ "step": 20
21
+ },
22
+ {
23
+ "epoch": 0.58,
24
+ "eval_accuracy": 0.9685863874345549,
25
+ "eval_loss": 0.10355287045240402,
26
+ "eval_runtime": 3.6181,
27
+ "eval_samples_per_second": 52.791,
28
+ "eval_steps_per_second": 6.633,
29
+ "step": 25
30
+ },
31
+ {
32
+ "epoch": 0.7,
33
+ "learning_rate": 0.00017674418604651164,
34
+ "loss": 0.3262,
35
+ "step": 30
36
+ },
37
+ {
38
+ "epoch": 0.93,
39
+ "learning_rate": 0.0001689922480620155,
40
+ "loss": 0.1114,
41
+ "step": 40
42
+ },
43
+ {
44
+ "epoch": 1.16,
45
+ "learning_rate": 0.00016124031007751937,
46
+ "loss": 0.0367,
47
+ "step": 50
48
+ },
49
+ {
50
+ "epoch": 1.16,
51
+ "eval_accuracy": 0.9738219895287958,
52
+ "eval_loss": 0.06718893349170685,
53
+ "eval_runtime": 3.0958,
54
+ "eval_samples_per_second": 61.697,
55
+ "eval_steps_per_second": 7.753,
56
+ "step": 50
57
+ },
58
+ {
59
+ "epoch": 1.4,
60
+ "learning_rate": 0.00015348837209302327,
61
+ "loss": 0.0738,
62
+ "step": 60
63
+ },
64
+ {
65
+ "epoch": 1.63,
66
+ "learning_rate": 0.00014573643410852714,
67
+ "loss": 0.0101,
68
+ "step": 70
69
+ },
70
+ {
71
+ "epoch": 1.74,
72
+ "eval_accuracy": 0.9790575916230366,
73
+ "eval_loss": 0.060171037912368774,
74
+ "eval_runtime": 3.0912,
75
+ "eval_samples_per_second": 61.789,
76
+ "eval_steps_per_second": 7.764,
77
+ "step": 75
78
+ },
79
+ {
80
+ "epoch": 1.86,
81
+ "learning_rate": 0.000137984496124031,
82
+ "loss": 0.0982,
83
+ "step": 80
84
+ },
85
+ {
86
+ "epoch": 2.09,
87
+ "learning_rate": 0.0001302325581395349,
88
+ "loss": 0.0409,
89
+ "step": 90
90
+ },
91
+ {
92
+ "epoch": 2.33,
93
+ "learning_rate": 0.00012248062015503876,
94
+ "loss": 0.0079,
95
+ "step": 100
96
+ },
97
+ {
98
+ "epoch": 2.33,
99
+ "eval_accuracy": 0.9790575916230366,
100
+ "eval_loss": 0.06641152501106262,
101
+ "eval_runtime": 3.0752,
102
+ "eval_samples_per_second": 62.11,
103
+ "eval_steps_per_second": 7.804,
104
+ "step": 100
105
+ },
106
+ {
107
+ "epoch": 2.56,
108
+ "learning_rate": 0.00011472868217054265,
109
+ "loss": 0.0075,
110
+ "step": 110
111
+ },
112
+ {
113
+ "epoch": 2.79,
114
+ "learning_rate": 0.00010697674418604651,
115
+ "loss": 0.0295,
116
+ "step": 120
117
+ },
118
+ {
119
+ "epoch": 2.91,
120
+ "eval_accuracy": 0.9685863874345549,
121
+ "eval_loss": 0.09663180261850357,
122
+ "eval_runtime": 3.2748,
123
+ "eval_samples_per_second": 58.325,
124
+ "eval_steps_per_second": 7.329,
125
+ "step": 125
126
+ },
127
+ {
128
+ "epoch": 3.02,
129
+ "learning_rate": 9.92248062015504e-05,
130
+ "loss": 0.0301,
131
+ "step": 130
132
+ },
133
+ {
134
+ "epoch": 3.26,
135
+ "learning_rate": 9.147286821705426e-05,
136
+ "loss": 0.0095,
137
+ "step": 140
138
+ },
139
+ {
140
+ "epoch": 3.49,
141
+ "learning_rate": 8.372093023255814e-05,
142
+ "loss": 0.0066,
143
+ "step": 150
144
+ },
145
+ {
146
+ "epoch": 3.49,
147
+ "eval_accuracy": 0.9790575916230366,
148
+ "eval_loss": 0.04968209192156792,
149
+ "eval_runtime": 3.1516,
150
+ "eval_samples_per_second": 60.603,
151
+ "eval_steps_per_second": 7.615,
152
+ "step": 150
153
+ },
154
+ {
155
+ "epoch": 3.72,
156
+ "learning_rate": 7.596899224806202e-05,
157
+ "loss": 0.0037,
158
+ "step": 160
159
+ },
160
+ {
161
+ "epoch": 3.95,
162
+ "learning_rate": 6.821705426356589e-05,
163
+ "loss": 0.0036,
164
+ "step": 170
165
+ },
166
+ {
167
+ "epoch": 4.07,
168
+ "eval_accuracy": 0.9842931937172775,
169
+ "eval_loss": 0.06203766167163849,
170
+ "eval_runtime": 3.6519,
171
+ "eval_samples_per_second": 52.302,
172
+ "eval_steps_per_second": 6.572,
173
+ "step": 175
174
+ },
175
+ {
176
+ "epoch": 4.19,
177
+ "learning_rate": 6.0465116279069765e-05,
178
+ "loss": 0.0034,
179
+ "step": 180
180
+ },
181
+ {
182
+ "epoch": 4.42,
183
+ "learning_rate": 5.271317829457365e-05,
184
+ "loss": 0.0033,
185
+ "step": 190
186
+ },
187
+ {
188
+ "epoch": 4.65,
189
+ "learning_rate": 4.496124031007753e-05,
190
+ "loss": 0.0063,
191
+ "step": 200
192
+ },
193
+ {
194
+ "epoch": 4.65,
195
+ "eval_accuracy": 0.9842931937172775,
196
+ "eval_loss": 0.0426977165043354,
197
+ "eval_runtime": 3.2933,
198
+ "eval_samples_per_second": 57.997,
199
+ "eval_steps_per_second": 7.288,
200
+ "step": 200
201
+ },
202
+ {
203
+ "epoch": 4.88,
204
+ "learning_rate": 3.7209302325581394e-05,
205
+ "loss": 0.003,
206
+ "step": 210
207
+ },
208
+ {
209
+ "epoch": 5.12,
210
+ "learning_rate": 2.9457364341085275e-05,
211
+ "loss": 0.0029,
212
+ "step": 220
213
+ },
214
+ {
215
+ "epoch": 5.23,
216
+ "eval_accuracy": 0.9842931937172775,
217
+ "eval_loss": 0.0413714237511158,
218
+ "eval_runtime": 3.0838,
219
+ "eval_samples_per_second": 61.937,
220
+ "eval_steps_per_second": 7.783,
221
+ "step": 225
222
+ },
223
+ {
224
+ "epoch": 5.35,
225
+ "learning_rate": 2.170542635658915e-05,
226
+ "loss": 0.0029,
227
+ "step": 230
228
+ },
229
+ {
230
+ "epoch": 5.58,
231
+ "learning_rate": 1.3953488372093024e-05,
232
+ "loss": 0.0028,
233
+ "step": 240
234
+ },
235
+ {
236
+ "epoch": 5.81,
237
+ "learning_rate": 6.2015503875969e-06,
238
+ "loss": 0.0028,
239
+ "step": 250
240
+ },
241
+ {
242
+ "epoch": 5.81,
243
+ "eval_accuracy": 0.9842931937172775,
244
+ "eval_loss": 0.041494447737932205,
245
+ "eval_runtime": 3.5969,
246
+ "eval_samples_per_second": 53.102,
247
+ "eval_steps_per_second": 6.672,
248
+ "step": 250
249
+ }
250
+ ],
251
+ "max_steps": 258,
252
+ "num_train_epochs": 6,
253
+ "total_flos": 3.09967958458368e+17,
254
+ "trial_name": null,
255
+ "trial_params": null
256
+ }
training_args.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bb7d7333348598c79ca1dc5993603769a73b7cc5c238d4dfddf5b1ec3ab43f59
3
+ size 3899