sksatyam committed on
Commit
41fc1b4
·
verified ·
1 Parent(s): 52dcb2c

🍻 cheers

Browse files
README.md CHANGED
@@ -3,6 +3,7 @@ library_name: transformers
3
  license: apache-2.0
4
  base_model: google/vit-base-patch16-224-in21k
5
  tags:
 
6
  - generated_from_trainer
7
  datasets:
8
  - imagefolder
@@ -15,7 +16,7 @@ model-index:
15
  name: Image Classification
16
  type: image-classification
17
  dataset:
18
- name: imagefolder
19
  type: imagefolder
20
  config: default
21
  split: train
@@ -31,7 +32,7 @@ should probably proofread and complete it, then remove this comment. -->
31
 
32
  # finetuned-websites
33
 
34
- This model is a fine-tuned version of [google/vit-base-patch16-224-in21k](https://huggingface.co/google/vit-base-patch16-224-in21k) on the imagefolder dataset.
35
  It achieves the following results on the evaluation set:
36
  - Loss: 0.8349
37
  - Accuracy: 0.75
 
3
  license: apache-2.0
4
  base_model: google/vit-base-patch16-224-in21k
5
  tags:
6
+ - image-classification
7
  - generated_from_trainer
8
  datasets:
9
  - imagefolder
 
16
  name: Image Classification
17
  type: image-classification
18
  dataset:
19
+ name: finetuned-websites
20
  type: imagefolder
21
  config: default
22
  split: train
 
32
 
33
  # finetuned-websites
34
 
35
+ This model is a fine-tuned version of [google/vit-base-patch16-224-in21k](https://huggingface.co/google/vit-base-patch16-224-in21k) on the finetuned-websites dataset.
36
  It achieves the following results on the evaluation set:
37
  - Loss: 0.8349
38
  - Accuracy: 0.75
all_results.json CHANGED
@@ -1,13 +1,13 @@
1
  {
2
  "epoch": 10.0,
3
- "eval_accuracy": 0.39705882352941174,
4
- "eval_loss": 1.5659970045089722,
5
- "eval_runtime": 3.0691,
6
- "eval_samples_per_second": 22.156,
7
- "eval_steps_per_second": 2.932,
8
  "total_flos": 2.9603266596900864e+17,
9
- "train_loss": 1.4860339760780334,
10
- "train_runtime": 184.3796,
11
- "train_samples_per_second": 20.718,
12
- "train_steps_per_second": 1.302
13
  }
 
1
  {
2
  "epoch": 10.0,
3
+ "eval_accuracy": 0.75,
4
+ "eval_loss": 0.8348819613456726,
5
+ "eval_runtime": 3.7302,
6
+ "eval_samples_per_second": 18.23,
7
+ "eval_steps_per_second": 2.413,
8
  "total_flos": 2.9603266596900864e+17,
9
+ "train_loss": 0.6847666402657827,
10
+ "train_runtime": 183.3512,
11
+ "train_samples_per_second": 20.834,
12
+ "train_steps_per_second": 1.309
13
  }
eval_results.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
  "epoch": 10.0,
3
- "eval_accuracy": 0.39705882352941174,
4
- "eval_loss": 1.5659970045089722,
5
- "eval_runtime": 3.0691,
6
- "eval_samples_per_second": 22.156,
7
- "eval_steps_per_second": 2.932
8
  }
 
1
  {
2
  "epoch": 10.0,
3
+ "eval_accuracy": 0.75,
4
+ "eval_loss": 0.8348819613456726,
5
+ "eval_runtime": 3.7302,
6
+ "eval_samples_per_second": 18.23,
7
+ "eval_steps_per_second": 2.413
8
  }
runs/Dec05_12-11-38_edab03f22c59/events.out.tfevents.1733400953.edab03f22c59.4058.3 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0ff60e75deea3850000873a6821a2bfe39847ef82669f7f2152048dac3d26cd2
3
+ size 411
train_results.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
  "epoch": 10.0,
3
  "total_flos": 2.9603266596900864e+17,
4
- "train_loss": 1.4860339760780334,
5
- "train_runtime": 184.3796,
6
- "train_samples_per_second": 20.718,
7
- "train_steps_per_second": 1.302
8
  }
 
1
  {
2
  "epoch": 10.0,
3
  "total_flos": 2.9603266596900864e+17,
4
+ "train_loss": 0.6847666402657827,
5
+ "train_runtime": 183.3512,
6
+ "train_samples_per_second": 20.834,
7
+ "train_steps_per_second": 1.309
8
  }
trainer_state.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
- "best_metric": 1.5659970045089722,
3
  "best_model_checkpoint": "finetuned-websites/checkpoint-200",
4
  "epoch": 10.0,
5
- "eval_steps": 50,
6
  "global_step": 240,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
@@ -10,223 +10,205 @@
10
  "log_history": [
11
  {
12
  "epoch": 0.4166666666666667,
13
- "grad_norm": 4.125311851501465,
14
- "learning_rate": 1.0000000000000002e-06,
15
- "loss": 1.9272,
16
  "step": 10
17
  },
18
  {
19
  "epoch": 0.8333333333333334,
20
- "grad_norm": 3.0228281021118164,
21
- "learning_rate": 2.0000000000000003e-06,
22
- "loss": 1.928,
23
  "step": 20
24
  },
25
  {
26
  "epoch": 1.25,
27
- "grad_norm": 2.5070629119873047,
28
- "learning_rate": 3e-06,
29
- "loss": 1.921,
30
  "step": 30
31
  },
32
  {
33
  "epoch": 1.6666666666666665,
34
- "grad_norm": 2.7787866592407227,
35
- "learning_rate": 4.000000000000001e-06,
36
- "loss": 1.8972,
37
  "step": 40
38
  },
39
  {
40
  "epoch": 2.0833333333333335,
41
- "grad_norm": 2.7862040996551514,
42
- "learning_rate": 5e-06,
43
- "loss": 1.8678,
44
- "step": 50
45
- },
46
- {
47
- "epoch": 2.0833333333333335,
48
- "eval_accuracy": 0.3088235294117647,
49
- "eval_loss": 1.8965561389923096,
50
- "eval_runtime": 2.6013,
51
- "eval_samples_per_second": 26.141,
52
- "eval_steps_per_second": 3.46,
53
  "step": 50
54
  },
55
  {
56
  "epoch": 2.5,
57
- "grad_norm": 3.540709972381592,
58
- "learning_rate": 6e-06,
59
- "loss": 1.8526,
60
  "step": 60
61
  },
62
  {
63
  "epoch": 2.9166666666666665,
64
- "grad_norm": 3.426781415939331,
65
- "learning_rate": 7.000000000000001e-06,
66
- "loss": 1.8198,
67
  "step": 70
68
  },
69
  {
70
  "epoch": 3.3333333333333335,
71
- "grad_norm": 4.007580757141113,
72
- "learning_rate": 8.000000000000001e-06,
73
- "loss": 1.7369,
74
  "step": 80
75
  },
76
  {
77
  "epoch": 3.75,
78
- "grad_norm": 4.467859745025635,
79
- "learning_rate": 9e-06,
80
- "loss": 1.7144,
81
  "step": 90
82
  },
83
  {
84
  "epoch": 4.166666666666667,
85
- "grad_norm": 3.9431729316711426,
86
- "learning_rate": 1e-05,
87
- "loss": 1.6483,
88
  "step": 100
89
  },
90
  {
91
  "epoch": 4.166666666666667,
92
- "eval_accuracy": 0.3382352941176471,
93
- "eval_loss": 1.793816089630127,
94
- "eval_runtime": 2.9764,
95
- "eval_samples_per_second": 22.847,
96
- "eval_steps_per_second": 3.024,
97
  "step": 100
98
  },
99
  {
100
  "epoch": 4.583333333333333,
101
- "grad_norm": 3.2608771324157715,
102
- "learning_rate": 1.1000000000000001e-05,
103
- "loss": 1.5856,
104
  "step": 110
105
  },
106
  {
107
  "epoch": 5.0,
108
- "grad_norm": 3.638972520828247,
109
- "learning_rate": 1.2e-05,
110
- "loss": 1.5157,
111
  "step": 120
112
  },
113
  {
114
  "epoch": 5.416666666666667,
115
- "grad_norm": 3.3878164291381836,
116
- "learning_rate": 1.3000000000000001e-05,
117
- "loss": 1.4388,
118
  "step": 130
119
  },
120
  {
121
  "epoch": 5.833333333333333,
122
- "grad_norm": 4.086641311645508,
123
- "learning_rate": 1.4000000000000001e-05,
124
- "loss": 1.4522,
125
  "step": 140
126
  },
127
  {
128
  "epoch": 6.25,
129
- "grad_norm": 3.5550928115844727,
130
- "learning_rate": 1.5e-05,
131
- "loss": 1.3419,
132
- "step": 150
133
- },
134
- {
135
- "epoch": 6.25,
136
- "eval_accuracy": 0.38235294117647056,
137
- "eval_loss": 1.6614487171173096,
138
- "eval_runtime": 2.1852,
139
- "eval_samples_per_second": 31.118,
140
- "eval_steps_per_second": 4.119,
141
  "step": 150
142
  },
143
  {
144
  "epoch": 6.666666666666667,
145
- "grad_norm": 4.774816036224365,
146
- "learning_rate": 1.6000000000000003e-05,
147
- "loss": 1.3147,
148
  "step": 160
149
  },
150
  {
151
  "epoch": 7.083333333333333,
152
- "grad_norm": 4.092309951782227,
153
- "learning_rate": 1.7000000000000003e-05,
154
- "loss": 1.2643,
155
  "step": 170
156
  },
157
  {
158
  "epoch": 7.5,
159
- "grad_norm": 4.992920398712158,
160
- "learning_rate": 1.8e-05,
161
- "loss": 1.1924,
162
  "step": 180
163
  },
164
  {
165
  "epoch": 7.916666666666667,
166
- "grad_norm": 6.251681327819824,
167
- "learning_rate": 1.9e-05,
168
- "loss": 1.1461,
169
  "step": 190
170
  },
171
  {
172
  "epoch": 8.333333333333334,
173
- "grad_norm": 5.500473499298096,
174
- "learning_rate": 2e-05,
175
- "loss": 1.1189,
176
  "step": 200
177
  },
178
  {
179
  "epoch": 8.333333333333334,
180
- "eval_accuracy": 0.39705882352941174,
181
- "eval_loss": 1.5659970045089722,
182
- "eval_runtime": 2.0786,
183
- "eval_samples_per_second": 32.715,
184
- "eval_steps_per_second": 4.33,
185
  "step": 200
186
  },
187
  {
188
  "epoch": 8.75,
189
- "grad_norm": 4.436168670654297,
190
- "learning_rate": 2.1e-05,
191
- "loss": 1.0734,
192
  "step": 210
193
  },
194
  {
195
  "epoch": 9.166666666666666,
196
- "grad_norm": 4.706101417541504,
197
- "learning_rate": 2.2000000000000003e-05,
198
- "loss": 0.9833,
199
  "step": 220
200
  },
201
  {
202
  "epoch": 9.583333333333334,
203
- "grad_norm": 4.173801898956299,
204
- "learning_rate": 2.3000000000000003e-05,
205
- "loss": 0.9902,
206
  "step": 230
207
  },
208
  {
209
  "epoch": 10.0,
210
- "grad_norm": 5.312504291534424,
211
- "learning_rate": 2.4e-05,
212
- "loss": 0.9339,
213
  "step": 240
214
  },
215
  {
216
  "epoch": 10.0,
217
  "step": 240,
218
  "total_flos": 2.9603266596900864e+17,
219
- "train_loss": 1.4860339760780334,
220
- "train_runtime": 184.3796,
221
- "train_samples_per_second": 20.718,
222
- "train_steps_per_second": 1.302
223
  }
224
  ],
225
  "logging_steps": 10,
226
  "max_steps": 240,
227
  "num_input_tokens_seen": 0,
228
  "num_train_epochs": 10,
229
- "save_steps": 50,
230
  "stateful_callbacks": {
231
  "TrainerControl": {
232
  "args": {
 
1
  {
2
+ "best_metric": 0.8348819613456726,
3
  "best_model_checkpoint": "finetuned-websites/checkpoint-200",
4
  "epoch": 10.0,
5
+ "eval_steps": 100,
6
  "global_step": 240,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
 
10
  "log_history": [
11
  {
12
  "epoch": 0.4166666666666667,
13
+ "grad_norm": 6.133713722229004,
14
+ "learning_rate": 1e-05,
15
+ "loss": 1.0596,
16
  "step": 10
17
  },
18
  {
19
  "epoch": 0.8333333333333334,
20
+ "grad_norm": 5.39012336730957,
21
+ "learning_rate": 2e-05,
22
+ "loss": 1.0523,
23
  "step": 20
24
  },
25
  {
26
  "epoch": 1.25,
27
+ "grad_norm": 4.8409881591796875,
28
+ "learning_rate": 3e-05,
29
+ "loss": 1.02,
30
  "step": 30
31
  },
32
  {
33
  "epoch": 1.6666666666666665,
34
+ "grad_norm": 5.128672122955322,
35
+ "learning_rate": 4e-05,
36
+ "loss": 0.9759,
37
  "step": 40
38
  },
39
  {
40
  "epoch": 2.0833333333333335,
41
+ "grad_norm": 6.329381465911865,
42
+ "learning_rate": 5e-05,
43
+ "loss": 0.9153,
 
 
 
 
 
 
 
 
 
44
  "step": 50
45
  },
46
  {
47
  "epoch": 2.5,
48
+ "grad_norm": 6.218069076538086,
49
+ "learning_rate": 6e-05,
50
+ "loss": 0.8539,
51
  "step": 60
52
  },
53
  {
54
  "epoch": 2.9166666666666665,
55
+ "grad_norm": 5.5271430015563965,
56
+ "learning_rate": 7.000000000000001e-05,
57
+ "loss": 0.8747,
58
  "step": 70
59
  },
60
  {
61
  "epoch": 3.3333333333333335,
62
+ "grad_norm": 8.148289680480957,
63
+ "learning_rate": 8e-05,
64
+ "loss": 0.7716,
65
  "step": 80
66
  },
67
  {
68
  "epoch": 3.75,
69
+ "grad_norm": 5.050111293792725,
70
+ "learning_rate": 8.9e-05,
71
+ "loss": 0.8763,
72
  "step": 90
73
  },
74
  {
75
  "epoch": 4.166666666666667,
76
+ "grad_norm": 5.70500373840332,
77
+ "learning_rate": 9.900000000000001e-05,
78
+ "loss": 0.6802,
79
  "step": 100
80
  },
81
  {
82
  "epoch": 4.166666666666667,
83
+ "eval_accuracy": 0.5735294117647058,
84
+ "eval_loss": 1.2561215162277222,
85
+ "eval_runtime": 2.1458,
86
+ "eval_samples_per_second": 31.69,
87
+ "eval_steps_per_second": 4.194,
88
  "step": 100
89
  },
90
  {
91
  "epoch": 4.583333333333333,
92
+ "grad_norm": 6.188072204589844,
93
+ "learning_rate": 0.000109,
94
+ "loss": 0.6251,
95
  "step": 110
96
  },
97
  {
98
  "epoch": 5.0,
99
+ "grad_norm": 9.144834518432617,
100
+ "learning_rate": 0.00011899999999999999,
101
+ "loss": 0.6689,
102
  "step": 120
103
  },
104
  {
105
  "epoch": 5.416666666666667,
106
+ "grad_norm": 5.840977668762207,
107
+ "learning_rate": 0.00012900000000000002,
108
+ "loss": 0.5262,
109
  "step": 130
110
  },
111
  {
112
  "epoch": 5.833333333333333,
113
+ "grad_norm": 22.520524978637695,
114
+ "learning_rate": 0.00013900000000000002,
115
+ "loss": 0.6559,
116
  "step": 140
117
  },
118
  {
119
  "epoch": 6.25,
120
+ "grad_norm": 7.3676676750183105,
121
+ "learning_rate": 0.000149,
122
+ "loss": 0.5186,
 
 
 
 
 
 
 
 
 
123
  "step": 150
124
  },
125
  {
126
  "epoch": 6.666666666666667,
127
+ "grad_norm": 16.96535873413086,
128
+ "learning_rate": 0.00015900000000000002,
129
+ "loss": 0.4291,
130
  "step": 160
131
  },
132
  {
133
  "epoch": 7.083333333333333,
134
+ "grad_norm": 4.878167629241943,
135
+ "learning_rate": 0.00016900000000000002,
136
+ "loss": 0.6311,
137
  "step": 170
138
  },
139
  {
140
  "epoch": 7.5,
141
+ "grad_norm": 5.731603145599365,
142
+ "learning_rate": 0.000179,
143
+ "loss": 0.4274,
144
  "step": 180
145
  },
146
  {
147
  "epoch": 7.916666666666667,
148
+ "grad_norm": 12.268874168395996,
149
+ "learning_rate": 0.000189,
150
+ "loss": 0.3916,
151
  "step": 190
152
  },
153
  {
154
  "epoch": 8.333333333333334,
155
+ "grad_norm": 19.5472469329834,
156
+ "learning_rate": 0.000199,
157
+ "loss": 0.3727,
158
  "step": 200
159
  },
160
  {
161
  "epoch": 8.333333333333334,
162
+ "eval_accuracy": 0.75,
163
+ "eval_loss": 0.8348819613456726,
164
+ "eval_runtime": 2.0932,
165
+ "eval_samples_per_second": 32.486,
166
+ "eval_steps_per_second": 4.3,
167
  "step": 200
168
  },
169
  {
170
  "epoch": 8.75,
171
+ "grad_norm": 9.300850868225098,
172
+ "learning_rate": 0.00020899999999999998,
173
+ "loss": 0.5022,
174
  "step": 210
175
  },
176
  {
177
  "epoch": 9.166666666666666,
178
+ "grad_norm": 2.52441668510437,
179
+ "learning_rate": 0.000219,
180
+ "loss": 0.3873,
181
  "step": 220
182
  },
183
  {
184
  "epoch": 9.583333333333334,
185
+ "grad_norm": 7.8756794929504395,
186
+ "learning_rate": 0.000229,
187
+ "loss": 0.5663,
188
  "step": 230
189
  },
190
  {
191
  "epoch": 10.0,
192
+ "grad_norm": 7.985933780670166,
193
+ "learning_rate": 0.00023899999999999998,
194
+ "loss": 0.6521,
195
  "step": 240
196
  },
197
  {
198
  "epoch": 10.0,
199
  "step": 240,
200
  "total_flos": 2.9603266596900864e+17,
201
+ "train_loss": 0.6847666402657827,
202
+ "train_runtime": 183.3512,
203
+ "train_samples_per_second": 20.834,
204
+ "train_steps_per_second": 1.309
205
  }
206
  ],
207
  "logging_steps": 10,
208
  "max_steps": 240,
209
  "num_input_tokens_seen": 0,
210
  "num_train_epochs": 10,
211
+ "save_steps": 100,
212
  "stateful_callbacks": {
213
  "TrainerControl": {
214
  "args": {