dima806 committed on
Commit
12ebfff
·
verified ·
1 Parent(s): f7836c6

Upload folder using huggingface_hub

Browse files
checkpoint-9376/model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:ac667f9891e096b94eec6a038cc2967f2cd9d88254165edf42d05ba621ba1c7a
3
  size 343245508
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1265d8e5a8a363a615898be873c224aebc6f310654bf23b1745da0975a7b7555
3
  size 343245508
checkpoint-9376/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:2297f022db5d3507731ee0645ef4ac9a9d0d10e51c904f9c64f2bb393f4d7fed
3
  size 686611898
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:db14e1baf0fce1ab79882476b9e400854724970e5adf6d8b17ef6d264fad3b22
3
  size 686611898
checkpoint-9376/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:19ef57ca7ce01a08a3ddc4d19049becd27a3d4c36511ddeaa3a26bb44693aa91
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:162830a25651b28da57d4375090a0500b22eb117bbfd79d4a2bf61dd85a56833
3
  size 1064
checkpoint-9376/trainer_state.json CHANGED
@@ -1,5 +1,5 @@
1
  {
2
- "best_metric": 1.0641573667526245,
3
  "best_model_checkpoint": "fairface_age_image_detection/checkpoint-9376",
4
  "epoch": 4.0,
5
  "eval_steps": 500,
@@ -10,168 +10,168 @@
10
  "log_history": [
11
  {
12
  "epoch": 0.21331058020477817,
13
- "grad_norm": 1.7275338172912598,
14
- "learning_rate": 2.855243405532919e-06,
15
- "loss": 1.8728,
16
  "step": 500
17
  },
18
  {
19
  "epoch": 0.42662116040955633,
20
- "grad_norm": 2.228030204772949,
21
- "learning_rate": 2.6944027450139397e-06,
22
- "loss": 1.4714,
23
  "step": 1000
24
  },
25
  {
26
  "epoch": 0.6399317406143344,
27
- "grad_norm": 2.2512168884277344,
28
- "learning_rate": 2.5335620844949606e-06,
29
- "loss": 1.3358,
30
  "step": 1500
31
  },
32
  {
33
  "epoch": 0.8532423208191127,
34
- "grad_norm": 3.124258279800415,
35
- "learning_rate": 2.372721423975981e-06,
36
- "loss": 1.264,
37
  "step": 2000
38
  },
39
  {
40
  "epoch": 1.0,
41
- "eval_accuracy": 0.5423,
42
- "eval_loss": 1.2151408195495605,
43
- "eval_model_preparation_time": 0.0043,
44
- "eval_runtime": 907.0206,
45
- "eval_samples_per_second": 11.025,
46
- "eval_steps_per_second": 1.378,
47
  "step": 2344
48
  },
49
  {
50
  "epoch": 1.0665529010238908,
51
- "grad_norm": 5.8204874992370605,
52
- "learning_rate": 2.211880763457002e-06,
53
- "loss": 1.2174,
54
  "step": 2500
55
  },
56
  {
57
  "epoch": 1.2798634812286689,
58
- "grad_norm": 5.175824165344238,
59
- "learning_rate": 2.051040102938023e-06,
60
- "loss": 1.171,
61
  "step": 3000
62
  },
63
  {
64
  "epoch": 1.493174061433447,
65
- "grad_norm": 3.312744617462158,
66
- "learning_rate": 1.8901994424190437e-06,
67
- "loss": 1.1425,
68
  "step": 3500
69
  },
70
  {
71
  "epoch": 1.7064846416382253,
72
- "grad_norm": 4.630620002746582,
73
- "learning_rate": 1.7293587819000642e-06,
74
- "loss": 1.1267,
75
  "step": 4000
76
  },
77
  {
78
  "epoch": 1.9197952218430034,
79
- "grad_norm": 3.5600452423095703,
80
- "learning_rate": 1.5685181213810853e-06,
81
- "loss": 1.1051,
82
  "step": 4500
83
  },
84
  {
85
  "epoch": 2.0,
86
- "eval_accuracy": 0.5688,
87
- "eval_loss": 1.1124917268753052,
88
- "eval_model_preparation_time": 0.0043,
89
- "eval_runtime": 915.0894,
90
- "eval_samples_per_second": 10.928,
91
- "eval_steps_per_second": 1.366,
92
  "step": 4688
93
  },
94
  {
95
  "epoch": 2.1331058020477816,
96
- "grad_norm": 7.453662395477295,
97
- "learning_rate": 1.407677460862106e-06,
98
- "loss": 1.0871,
99
  "step": 5000
100
  },
101
  {
102
  "epoch": 2.34641638225256,
103
- "grad_norm": 8.157800674438477,
104
- "learning_rate": 1.2468368003431269e-06,
105
- "loss": 1.0696,
106
  "step": 5500
107
  },
108
  {
109
  "epoch": 2.5597269624573378,
110
- "grad_norm": 3.6688616275787354,
111
- "learning_rate": 1.0859961398241475e-06,
112
- "loss": 1.0571,
113
  "step": 6000
114
  },
115
  {
116
  "epoch": 2.773037542662116,
117
- "grad_norm": 3.1099190711975098,
118
- "learning_rate": 9.251554793051683e-07,
119
- "loss": 1.0476,
120
  "step": 6500
121
  },
122
  {
123
  "epoch": 2.986348122866894,
124
- "grad_norm": 5.784822463989258,
125
- "learning_rate": 7.643148187861893e-07,
126
- "loss": 1.0407,
127
  "step": 7000
128
  },
129
  {
130
  "epoch": 3.0,
131
- "eval_accuracy": 0.5756,
132
- "eval_loss": 1.0761935710906982,
133
- "eval_model_preparation_time": 0.0043,
134
- "eval_runtime": 920.0161,
135
- "eval_samples_per_second": 10.869,
136
- "eval_steps_per_second": 1.359,
137
  "step": 7032
138
  },
139
  {
140
  "epoch": 3.1996587030716723,
141
- "grad_norm": 5.856372833251953,
142
- "learning_rate": 6.0347415826721e-07,
143
- "loss": 1.0212,
144
  "step": 7500
145
  },
146
  {
147
  "epoch": 3.4129692832764507,
148
- "grad_norm": 5.725022792816162,
149
- "learning_rate": 4.426334977482307e-07,
150
- "loss": 1.0253,
151
  "step": 8000
152
  },
153
  {
154
  "epoch": 3.6262798634812285,
155
- "grad_norm": 4.74147891998291,
156
- "learning_rate": 2.8179283722925154e-07,
157
- "loss": 1.0232,
158
  "step": 8500
159
  },
160
  {
161
  "epoch": 3.839590443686007,
162
- "grad_norm": 4.050413131713867,
163
- "learning_rate": 1.2095217671027237e-07,
164
- "loss": 1.0173,
165
  "step": 9000
166
  },
167
  {
168
  "epoch": 4.0,
169
- "eval_accuracy": 0.5791,
170
- "eval_loss": 1.0641573667526245,
171
- "eval_model_preparation_time": 0.0043,
172
- "eval_runtime": 919.3696,
173
- "eval_samples_per_second": 10.877,
174
- "eval_steps_per_second": 1.36,
175
  "step": 9376
176
  }
177
  ],
 
1
  {
2
+ "best_metric": 1.0019118785858154,
3
  "best_model_checkpoint": "fairface_age_image_detection/checkpoint-9376",
4
  "epoch": 4.0,
5
  "eval_steps": 500,
 
10
  "log_history": [
11
  {
12
  "epoch": 0.21331058020477817,
13
+ "grad_norm": 2.756800413131714,
14
+ "learning_rate": 5.710486811065838e-06,
15
+ "loss": 1.7206,
16
  "step": 500
17
  },
18
  {
19
  "epoch": 0.42662116040955633,
20
+ "grad_norm": 3.085395097732544,
21
+ "learning_rate": 5.3888054900278794e-06,
22
+ "loss": 1.3151,
23
  "step": 1000
24
  },
25
  {
26
  "epoch": 0.6399317406143344,
27
+ "grad_norm": 3.533961057662964,
28
+ "learning_rate": 5.067124168989921e-06,
29
+ "loss": 1.212,
30
  "step": 1500
31
  },
32
  {
33
  "epoch": 0.8532423208191127,
34
+ "grad_norm": 5.493643283843994,
35
+ "learning_rate": 4.745442847951962e-06,
36
+ "loss": 1.145,
37
  "step": 2000
38
  },
39
  {
40
  "epoch": 1.0,
41
+ "eval_accuracy": 0.5652,
42
+ "eval_loss": 1.115075707435608,
43
+ "eval_model_preparation_time": 0.0037,
44
+ "eval_runtime": 903.327,
45
+ "eval_samples_per_second": 11.07,
46
+ "eval_steps_per_second": 1.384,
47
  "step": 2344
48
  },
49
  {
50
  "epoch": 1.0665529010238908,
51
+ "grad_norm": 5.28899621963501,
52
+ "learning_rate": 4.423761526914004e-06,
53
+ "loss": 1.1006,
54
  "step": 2500
55
  },
56
  {
57
  "epoch": 1.2798634812286689,
58
+ "grad_norm": 6.52961540222168,
59
+ "learning_rate": 4.102080205876046e-06,
60
+ "loss": 1.0519,
61
  "step": 3000
62
  },
63
  {
64
  "epoch": 1.493174061433447,
65
+ "grad_norm": 10.652497291564941,
66
+ "learning_rate": 3.7803988848380875e-06,
67
+ "loss": 1.0292,
68
  "step": 3500
69
  },
70
  {
71
  "epoch": 1.7064846416382253,
72
+ "grad_norm": 5.245483875274658,
73
+ "learning_rate": 3.4587175638001284e-06,
74
+ "loss": 1.016,
75
  "step": 4000
76
  },
77
  {
78
  "epoch": 1.9197952218430034,
79
+ "grad_norm": 4.070522308349609,
80
+ "learning_rate": 3.1370362427621706e-06,
81
+ "loss": 1.0056,
82
  "step": 4500
83
  },
84
  {
85
  "epoch": 2.0,
86
+ "eval_accuracy": 0.5831,
87
+ "eval_loss": 1.030907392501831,
88
+ "eval_model_preparation_time": 0.0037,
89
+ "eval_runtime": 917.4025,
90
+ "eval_samples_per_second": 10.9,
91
+ "eval_steps_per_second": 1.363,
92
  "step": 4688
93
  },
94
  {
95
  "epoch": 2.1331058020477816,
96
+ "grad_norm": 6.568565845489502,
97
+ "learning_rate": 2.815354921724212e-06,
98
+ "loss": 0.9796,
99
  "step": 5000
100
  },
101
  {
102
  "epoch": 2.34641638225256,
103
+ "grad_norm": 10.742039680480957,
104
+ "learning_rate": 2.4936736006862537e-06,
105
+ "loss": 0.9587,
106
  "step": 5500
107
  },
108
  {
109
  "epoch": 2.5597269624573378,
110
+ "grad_norm": 4.3592424392700195,
111
+ "learning_rate": 2.171992279648295e-06,
112
+ "loss": 0.9455,
113
  "step": 6000
114
  },
115
  {
116
  "epoch": 2.773037542662116,
117
+ "grad_norm": 5.696556091308594,
118
+ "learning_rate": 1.8503109586103366e-06,
119
+ "loss": 0.9363,
120
  "step": 6500
121
  },
122
  {
123
  "epoch": 2.986348122866894,
124
+ "grad_norm": 5.746116638183594,
125
+ "learning_rate": 1.5286296375723786e-06,
126
+ "loss": 0.9347,
127
  "step": 7000
128
  },
129
  {
130
  "epoch": 3.0,
131
+ "eval_accuracy": 0.5883,
132
+ "eval_loss": 1.0057746171951294,
133
+ "eval_model_preparation_time": 0.0037,
134
+ "eval_runtime": 926.1536,
135
+ "eval_samples_per_second": 10.797,
136
+ "eval_steps_per_second": 1.35,
137
  "step": 7032
138
  },
139
  {
140
  "epoch": 3.1996587030716723,
141
+ "grad_norm": 4.218583106994629,
142
+ "learning_rate": 1.20694831653442e-06,
143
+ "loss": 0.9035,
144
  "step": 7500
145
  },
146
  {
147
  "epoch": 3.4129692832764507,
148
+ "grad_norm": 6.724698543548584,
149
+ "learning_rate": 8.852669954964614e-07,
150
+ "loss": 0.9081,
151
  "step": 8000
152
  },
153
  {
154
  "epoch": 3.6262798634812285,
155
+ "grad_norm": 6.658480167388916,
156
+ "learning_rate": 5.635856744585031e-07,
157
+ "loss": 0.905,
158
  "step": 8500
159
  },
160
  {
161
  "epoch": 3.839590443686007,
162
+ "grad_norm": 4.382744789123535,
163
+ "learning_rate": 2.4190435342054474e-07,
164
+ "loss": 0.8969,
165
  "step": 9000
166
  },
167
  {
168
  "epoch": 4.0,
169
+ "eval_accuracy": 0.5892,
170
+ "eval_loss": 1.0019118785858154,
171
+ "eval_model_preparation_time": 0.0037,
172
+ "eval_runtime": 929.5968,
173
+ "eval_samples_per_second": 10.757,
174
+ "eval_steps_per_second": 1.345,
175
  "step": 9376
176
  }
177
  ],
checkpoint-9376/training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:50f7f93c67bf88403da8f77fa2109e270c1cad6076487c78154dcb74bbd014af
3
  size 5304
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5ba8df84fa27b6ce1aa5fc9dad74c0fa9ee6fdec46d72d1f00235b986d4684db
3
  size 5304
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:cd3a725b1119d48b89118403515c77428316605407f871bbc7bba7fb50b32305
3
  size 343245508
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1265d8e5a8a363a615898be873c224aebc6f310654bf23b1745da0975a7b7555
3
  size 343245508
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:e97ef976af56a6fd0395073925187744ad7c56829cffa99ff2332a90f94307b2
3
  size 5304
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5ba8df84fa27b6ce1aa5fc9dad74c0fa9ee6fdec46d72d1f00235b986d4684db
3
  size 5304