dima806 committed on
Commit
0ebac69
1 Parent(s): e662121

Upload folder using huggingface_hub

Browse files
checkpoint-10945/model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:6348eb719a7297b32f9d505e6faae70879959d90f18a0eae8ee09a1cd305ea5f
3
  size 343525432
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2f555c6b4b8c1e7bfe5a6641ceb011bba582f38f38b9118718e30876fe535b20
3
  size 343525432
checkpoint-10945/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:5969427d9bb485c2d9609b0123b21ee458bb8dca1a04261596cd9f589d71d449
3
  size 687171333
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c53470a91547570b2c51d204f335b50d27b9315080f02b7cedde0584f51e9462
3
  size 687171333
checkpoint-10945/trainer_state.json CHANGED
@@ -1,5 +1,5 @@
1
  {
2
- "best_metric": 0.5650318264961243,
3
  "best_model_checkpoint": "mushrooms_image_detection/checkpoint-10945",
4
  "epoch": 1.0,
5
  "eval_steps": 500,
@@ -10,158 +10,158 @@
10
  "log_history": [
11
  {
12
  "epoch": 0.05,
13
- "grad_norm": 2.6588985919952393,
14
  "learning_rate": 1.9173932996787516e-07,
15
- "loss": 0.647,
16
  "step": 500
17
  },
18
  {
19
  "epoch": 0.09,
20
- "grad_norm": 6.133805274963379,
21
  "learning_rate": 1.825608077099587e-07,
22
- "loss": 0.6472,
23
  "step": 1000
24
  },
25
  {
26
  "epoch": 0.14,
27
- "grad_norm": 5.8800435066223145,
28
  "learning_rate": 1.733822854520422e-07,
29
- "loss": 0.6606,
30
  "step": 1500
31
  },
32
  {
33
  "epoch": 0.18,
34
- "grad_norm": 3.6122307777404785,
35
  "learning_rate": 1.6420376319412576e-07,
36
- "loss": 0.6485,
37
  "step": 2000
38
  },
39
  {
40
  "epoch": 0.23,
41
- "grad_norm": 6.25240421295166,
42
  "learning_rate": 1.5502524093620926e-07,
43
- "loss": 0.6434,
44
  "step": 2500
45
  },
46
  {
47
  "epoch": 0.27,
48
- "grad_norm": 3.467872142791748,
49
  "learning_rate": 1.458467186782928e-07,
50
- "loss": 0.6129,
51
  "step": 3000
52
  },
53
  {
54
  "epoch": 0.32,
55
- "grad_norm": 6.264642715454102,
56
  "learning_rate": 1.366681964203763e-07,
57
- "loss": 0.6313,
58
  "step": 3500
59
  },
60
  {
61
  "epoch": 0.37,
62
- "grad_norm": 4.573624134063721,
63
  "learning_rate": 1.2748967416245983e-07,
64
- "loss": 0.6412,
65
  "step": 4000
66
  },
67
  {
68
  "epoch": 0.41,
69
- "grad_norm": 5.538139820098877,
70
  "learning_rate": 1.1831115190454337e-07,
71
- "loss": 0.6479,
72
  "step": 4500
73
  },
74
  {
75
  "epoch": 0.46,
76
- "grad_norm": 5.533720970153809,
77
  "learning_rate": 1.0913262964662688e-07,
78
- "loss": 0.6294,
79
  "step": 5000
80
  },
81
  {
82
  "epoch": 0.5,
83
- "grad_norm": 7.556946754455566,
84
  "learning_rate": 9.995410738871042e-08,
85
- "loss": 0.6289,
86
  "step": 5500
87
  },
88
  {
89
  "epoch": 0.55,
90
- "grad_norm": 5.644389629364014,
91
  "learning_rate": 9.077558513079394e-08,
92
- "loss": 0.6224,
93
  "step": 6000
94
  },
95
  {
96
  "epoch": 0.59,
97
- "grad_norm": 3.989530086517334,
98
  "learning_rate": 8.159706287287747e-08,
99
- "loss": 0.6337,
100
  "step": 6500
101
  },
102
  {
103
  "epoch": 0.64,
104
- "grad_norm": 11.623241424560547,
105
  "learning_rate": 7.241854061496099e-08,
106
- "loss": 0.6231,
107
  "step": 7000
108
  },
109
  {
110
  "epoch": 0.69,
111
- "grad_norm": 5.611315727233887,
112
  "learning_rate": 6.32400183570445e-08,
113
- "loss": 0.6219,
114
  "step": 7500
115
  },
116
  {
117
  "epoch": 0.73,
118
- "grad_norm": 5.866851329803467,
119
  "learning_rate": 5.406149609912804e-08,
120
- "loss": 0.631,
121
  "step": 8000
122
  },
123
  {
124
  "epoch": 0.78,
125
- "grad_norm": 4.226177215576172,
126
  "learning_rate": 4.488297384121156e-08,
127
- "loss": 0.632,
128
  "step": 8500
129
  },
130
  {
131
  "epoch": 0.82,
132
- "grad_norm": 5.706874370574951,
133
  "learning_rate": 3.5704451583295086e-08,
134
- "loss": 0.6222,
135
  "step": 9000
136
  },
137
  {
138
  "epoch": 0.87,
139
- "grad_norm": 8.87269401550293,
140
  "learning_rate": 2.6525929325378617e-08,
141
- "loss": 0.6333,
142
  "step": 9500
143
  },
144
  {
145
  "epoch": 0.91,
146
- "grad_norm": 6.855080604553223,
147
  "learning_rate": 1.7347407067462138e-08,
148
- "loss": 0.635,
149
  "step": 10000
150
  },
151
  {
152
  "epoch": 0.96,
153
- "grad_norm": 12.029609680175781,
154
  "learning_rate": 8.168884809545663e-09,
155
- "loss": 0.6388,
156
  "step": 10500
157
  },
158
  {
159
  "epoch": 1.0,
160
- "eval_accuracy": 0.8963294500599623,
161
- "eval_loss": 0.5650318264961243,
162
- "eval_runtime": 2859.1049,
163
- "eval_samples_per_second": 81.662,
164
- "eval_steps_per_second": 10.208,
165
  "step": 10945
166
  }
167
  ],
 
1
  {
2
+ "best_metric": 0.5469852685928345,
3
  "best_model_checkpoint": "mushrooms_image_detection/checkpoint-10945",
4
  "epoch": 1.0,
5
  "eval_steps": 500,
 
10
  "log_history": [
11
  {
12
  "epoch": 0.05,
13
+ "grad_norm": 6.199071407318115,
14
  "learning_rate": 1.9173932996787516e-07,
15
+ "loss": 0.6273,
16
  "step": 500
17
  },
18
  {
19
  "epoch": 0.09,
20
+ "grad_norm": 6.411447048187256,
21
  "learning_rate": 1.825608077099587e-07,
22
+ "loss": 0.6283,
23
  "step": 1000
24
  },
25
  {
26
  "epoch": 0.14,
27
+ "grad_norm": 6.0922088623046875,
28
  "learning_rate": 1.733822854520422e-07,
29
+ "loss": 0.6121,
30
  "step": 1500
31
  },
32
  {
33
  "epoch": 0.18,
34
+ "grad_norm": 5.242175579071045,
35
  "learning_rate": 1.6420376319412576e-07,
36
+ "loss": 0.6357,
37
  "step": 2000
38
  },
39
  {
40
  "epoch": 0.23,
41
+ "grad_norm": 5.726295471191406,
42
  "learning_rate": 1.5502524093620926e-07,
43
+ "loss": 0.6094,
44
  "step": 2500
45
  },
46
  {
47
  "epoch": 0.27,
48
+ "grad_norm": 7.89302921295166,
49
  "learning_rate": 1.458467186782928e-07,
50
+ "loss": 0.6297,
51
  "step": 3000
52
  },
53
  {
54
  "epoch": 0.32,
55
+ "grad_norm": 6.494805812835693,
56
  "learning_rate": 1.366681964203763e-07,
57
+ "loss": 0.6104,
58
  "step": 3500
59
  },
60
  {
61
  "epoch": 0.37,
62
+ "grad_norm": 6.374981880187988,
63
  "learning_rate": 1.2748967416245983e-07,
64
+ "loss": 0.6111,
65
  "step": 4000
66
  },
67
  {
68
  "epoch": 0.41,
69
+ "grad_norm": 8.1451416015625,
70
  "learning_rate": 1.1831115190454337e-07,
71
+ "loss": 0.6039,
72
  "step": 4500
73
  },
74
  {
75
  "epoch": 0.46,
76
+ "grad_norm": 7.26981258392334,
77
  "learning_rate": 1.0913262964662688e-07,
78
+ "loss": 0.6102,
79
  "step": 5000
80
  },
81
  {
82
  "epoch": 0.5,
83
+ "grad_norm": 7.569005966186523,
84
  "learning_rate": 9.995410738871042e-08,
85
+ "loss": 0.6167,
86
  "step": 5500
87
  },
88
  {
89
  "epoch": 0.55,
90
+ "grad_norm": 3.174710750579834,
91
  "learning_rate": 9.077558513079394e-08,
92
+ "loss": 0.6036,
93
  "step": 6000
94
  },
95
  {
96
  "epoch": 0.59,
97
+ "grad_norm": 6.182538986206055,
98
  "learning_rate": 8.159706287287747e-08,
99
+ "loss": 0.6166,
100
  "step": 6500
101
  },
102
  {
103
  "epoch": 0.64,
104
+ "grad_norm": 8.289917945861816,
105
  "learning_rate": 7.241854061496099e-08,
106
+ "loss": 0.6227,
107
  "step": 7000
108
  },
109
  {
110
  "epoch": 0.69,
111
+ "grad_norm": 4.353749752044678,
112
  "learning_rate": 6.32400183570445e-08,
113
+ "loss": 0.6204,
114
  "step": 7500
115
  },
116
  {
117
  "epoch": 0.73,
118
+ "grad_norm": 7.799861431121826,
119
  "learning_rate": 5.406149609912804e-08,
120
+ "loss": 0.6079,
121
  "step": 8000
122
  },
123
  {
124
  "epoch": 0.78,
125
+ "grad_norm": 9.668302536010742,
126
  "learning_rate": 4.488297384121156e-08,
127
+ "loss": 0.6149,
128
  "step": 8500
129
  },
130
  {
131
  "epoch": 0.82,
132
+ "grad_norm": 6.9307451248168945,
133
  "learning_rate": 3.5704451583295086e-08,
134
+ "loss": 0.6046,
135
  "step": 9000
136
  },
137
  {
138
  "epoch": 0.87,
139
+ "grad_norm": 14.261872291564941,
140
  "learning_rate": 2.6525929325378617e-08,
141
+ "loss": 0.6073,
142
  "step": 9500
143
  },
144
  {
145
  "epoch": 0.91,
146
+ "grad_norm": 7.5108466148376465,
147
  "learning_rate": 1.7347407067462138e-08,
148
+ "loss": 0.6144,
149
  "step": 10000
150
  },
151
  {
152
  "epoch": 0.96,
153
+ "grad_norm": 5.3811516761779785,
154
  "learning_rate": 8.168884809545663e-09,
155
+ "loss": 0.613,
156
  "step": 10500
157
  },
158
  {
159
  "epoch": 1.0,
160
+ "eval_accuracy": 0.899032037005311,
161
+ "eval_loss": 0.5469852685928345,
162
+ "eval_runtime": 2983.2159,
163
+ "eval_samples_per_second": 78.265,
164
+ "eval_steps_per_second": 9.783,
165
  "step": 10945
166
  }
167
  ],
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:6348eb719a7297b32f9d505e6faae70879959d90f18a0eae8ee09a1cd305ea5f
3
  size 343525432
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2f555c6b4b8c1e7bfe5a6641ceb011bba582f38f38b9118718e30876fe535b20
3
  size 343525432