alexbeta80 committed on
Commit
4cbbe77
·
verified ·
1 Parent(s): ef49966

End of training

Browse files
README.md CHANGED
@@ -1,6 +1,6 @@
1
  ---
2
  license: mit
3
- base_model: alexbeta80/donut-test
4
  tags:
5
  - generated_from_trainer
6
  datasets:
@@ -15,7 +15,7 @@ should probably proofread and complete it, then remove this comment. -->
15
 
16
  # donut-test-ddt
17
 
18
- This model is a fine-tuned version of [alexbeta80/donut-test](https://huggingface.co/alexbeta80/donut-test) on the imagefolder dataset.
19
 
20
  ## Model description
21
 
@@ -40,7 +40,7 @@ The following hyperparameters were used during training:
40
  - seed: 42
41
  - optimizer: Adam with betas=(0.9,0.999) and epsilon=1e-08
42
  - lr_scheduler_type: linear
43
- - num_epochs: 10
44
 
45
  ### Training results
46
 
 
1
  ---
2
  license: mit
3
+ base_model: naver-clova-ix/donut-base
4
  tags:
5
  - generated_from_trainer
6
  datasets:
 
15
 
16
  # donut-test-ddt
17
 
18
+ This model is a fine-tuned version of [naver-clova-ix/donut-base](https://huggingface.co/naver-clova-ix/donut-base) on the imagefolder dataset.
19
 
20
  ## Model description
21
 
 
40
  - seed: 42
41
  - optimizer: Adam with betas=(0.9,0.999) and epsilon=1e-08
42
  - lr_scheduler_type: linear
43
+ - num_epochs: 8
44
 
45
  ### Training results
46
 
added_tokens.json CHANGED
@@ -1,34 +1,20 @@
1
  {
2
  "</s>": 2,
3
- "</s_Consignee>": 57536,
4
- "</s_Consignee_Country>": 57533,
5
- "</s_Consignor>": 57549,
6
- "</s_Consignor_Country>": 57535,
7
- "</s_Goods_Description>": 57541,
8
- "</s_Marks>": 57548,
9
- "</s_Notify>": 57540,
10
- "</s_Notify_Country>": 57529,
11
- "</s_Second_Notify>": 57546,
12
- "</s_Second_Notify_Country>": 57532,
13
- "</s_Total_Packages>": 57550,
14
- "</s_Total_Volume>": 57547,
15
- "</s_Total_Weight>": 57544,
16
  "<mask>": 57521,
17
  "<pad>": 1,
18
  "<s>": 0,
19
- "<s_Consignee>": 57545,
20
- "<s_Consignee_Country>": 57528,
21
- "<s_Consignor>": 57530,
22
- "<s_Consignor_Country>": 57527,
23
- "<s_Goods_Description>": 57534,
24
- "<s_Marks>": 57538,
25
- "<s_Notify>": 57525,
26
- "<s_Notify_Country>": 57531,
27
- "<s_Second_Notify>": 57542,
28
- "<s_Second_Notify_Country>": 57537,
29
- "<s_Total_Packages>": 57526,
30
- "<s_Total_Volume>": 57543,
31
- "<s_Total_Weight>": 57539,
32
  "<s_iitcdip>": 57523,
33
  "<s_synthdog>": 57524,
34
  "<sep/>": 57522,
 
1
  {
2
  "</s>": 2,
3
+ "</s_Codici>": 57531,
4
+ "</s_Data>": 57536,
5
+ "</s_Fornitore>": 57533,
6
+ "</s_Numero>": 57529,
7
+ "</s_Posizioni>": 57530,
8
+ "</s_Quantita>": 57528,
 
 
 
 
 
 
 
9
  "<mask>": 57521,
10
  "<pad>": 1,
11
  "<s>": 0,
12
+ "<s_Codici>": 57527,
13
+ "<s_Data>": 57526,
14
+ "<s_Fornitore>": 57535,
15
+ "<s_Numero>": 57534,
16
+ "<s_Posizioni>": 57525,
17
+ "<s_Quantita>": 57532,
 
 
 
 
 
 
 
18
  "<s_iitcdip>": 57523,
19
  "<s_synthdog>": 57524,
20
  "<sep/>": 57522,
config.json CHANGED
@@ -1,5 +1,5 @@
1
  {
2
- "_name_or_path": "alexbeta80/donut-test",
3
  "architectures": [
4
  "VisionEncoderDecoderModel"
5
  ],
@@ -85,7 +85,7 @@
85
  "typical_p": 1.0,
86
  "use_bfloat16": false,
87
  "use_cache": true,
88
- "vocab_size": 57551
89
  },
90
  "decoder_start_token_id": 0,
91
  "encoder": {
@@ -124,8 +124,8 @@
124
  "1": "LABEL_1"
125
  },
126
  "image_size": [
127
- 1169,
128
- 827
129
  ],
130
  "initializer_range": 0.02,
131
  "is_decoder": false,
 
1
  {
2
+ "_name_or_path": "naver-clova-ix/donut-base",
3
  "architectures": [
4
  "VisionEncoderDecoderModel"
5
  ],
 
85
  "typical_p": 1.0,
86
  "use_bfloat16": false,
87
  "use_cache": true,
88
+ "vocab_size": 57537
89
  },
90
  "decoder_start_token_id": 0,
91
  "encoder": {
 
124
  "1": "LABEL_1"
125
  },
126
  "image_size": [
127
+ 700,
128
+ 520
129
  ],
130
  "initializer_range": 0.02,
131
  "is_decoder": false,
generation_config.json CHANGED
@@ -1,10 +1,8 @@
1
  {
2
  "_from_model_config": true,
3
  "bos_token_id": 0,
4
- "decoder_start_token_id": 0,
5
  "eos_token_id": 2,
6
  "forced_eos_token_id": 2,
7
- "max_length": 512,
8
  "pad_token_id": 1,
9
  "transformers_version": "4.34.0"
10
  }
 
1
  {
2
  "_from_model_config": true,
3
  "bos_token_id": 0,
 
4
  "eos_token_id": 2,
5
  "forced_eos_token_id": 2,
 
6
  "pad_token_id": 1,
7
  "transformers_version": "4.34.0"
8
  }
preprocessor_config.json CHANGED
@@ -19,8 +19,8 @@
19
  "processor_class": "DonutProcessor",
20
  "resample": 2,
21
  "rescale_factor": 0.00392156862745098,
22
- "size": {
23
- "height": 1169,
24
- "width": 827
25
- }
26
  }
 
19
  "processor_class": "DonutProcessor",
20
  "resample": 2,
21
  "rescale_factor": 0.00392156862745098,
22
+ "size": [
23
+ 520,
24
+ 700
25
+ ]
26
  }
pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:17e96dcdcf9a2aced71e90c4991db40b87bd3e51312835f729dc5ce38c8777e6
3
- size 809285846
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d5470c283cff8de1c4095140891f380a5e2774fe2278a27b30269dca234488ae
3
+ size 809228502
special_tokens_map.json CHANGED
@@ -1,38 +1,21 @@
1
  {
2
  "additional_special_tokens": [
3
- "<s>",
4
- "<pad>",
5
- "</s>",
6
- "<unk>",
7
- "<mask>",
8
  "<s_iitcdip>",
9
  "<s_synthdog>",
10
- "<s_Notify>",
11
- "<s_Total_Packages>",
12
- "<s_Consignor_Country>",
13
- "<s_Consignee_Country>",
14
- "</s_Notify_Country>",
15
- "<s_Consignor>",
16
- "<s_Notify_Country>",
17
- "</s_Second_Notify_Country>",
18
- "</s_Consignee_Country>",
19
- "<s_Goods_Description>",
20
- "</s_Consignor_Country>",
21
- "</s_Consignee>",
22
- "<s_Second_Notify_Country>",
23
- "<s_Marks>",
24
- "<s_Total_Weight>",
25
- "</s_Notify>",
26
- "</s_Goods_Description>",
27
- "<s_Second_Notify>",
28
- "<s_Total_Volume>",
29
- "</s_Total_Weight>",
30
- "<s_Consignee>",
31
- "</s_Second_Notify>",
32
- "</s_Total_Volume>",
33
- "</s_Marks>",
34
- "</s_Consignor>",
35
- "</s_Total_Packages>"
36
  ],
37
  "bos_token": "<s>",
38
  "cls_token": "<s>",
 
1
  {
2
  "additional_special_tokens": [
 
 
 
 
 
3
  "<s_iitcdip>",
4
  "<s_synthdog>",
5
+ "<s_Posizioni>",
6
+ "<s_Data>",
7
+ "<s_Codici>",
8
+ "</s>",
9
+ "</s_Quantita>",
10
+ "</s_Numero>",
11
+ "</s_Posizioni>",
12
+ "</s_Codici>",
13
+ "<s_Quantita>",
14
+ "</s_Fornitore>",
15
+ "<s_Numero>",
16
+ "<s_Fornitore>",
17
+ "<s>",
18
+ "</s_Data>"
 
 
 
 
 
 
 
 
 
 
 
 
19
  ],
20
  "bos_token": "<s>",
21
  "cls_token": "<s>",
tokenizer.json CHANGED
The diff for this file is too large to render. See raw diff
 
tokenizer_config.json CHANGED
@@ -2,9 +2,9 @@
2
  "added_tokens_decoder": {
3
  "0": {
4
  "content": "<s>",
5
- "lstrip": false,
6
  "normalized": false,
7
- "rstrip": false,
8
  "single_word": false,
9
  "special": true
10
  },
@@ -18,9 +18,9 @@
18
  },
19
  "2": {
20
  "content": "</s>",
21
- "lstrip": false,
22
  "normalized": false,
23
- "rstrip": false,
24
  "single_word": false,
25
  "special": true
26
  },
@@ -35,7 +35,7 @@
35
  "57521": {
36
  "content": "<mask>",
37
  "lstrip": true,
38
- "normalized": false,
39
  "rstrip": false,
40
  "single_word": false,
41
  "special": true
@@ -65,7 +65,7 @@
65
  "special": true
66
  },
67
  "57525": {
68
- "content": "<s_Notify>",
69
  "lstrip": true,
70
  "normalized": false,
71
  "rstrip": true,
@@ -73,7 +73,7 @@
73
  "special": true
74
  },
75
  "57526": {
76
- "content": "<s_Total_Packages>",
77
  "lstrip": true,
78
  "normalized": false,
79
  "rstrip": true,
@@ -81,7 +81,7 @@
81
  "special": true
82
  },
83
  "57527": {
84
- "content": "<s_Consignor_Country>",
85
  "lstrip": true,
86
  "normalized": false,
87
  "rstrip": true,
@@ -89,7 +89,7 @@
89
  "special": true
90
  },
91
  "57528": {
92
- "content": "<s_Consignee_Country>",
93
  "lstrip": true,
94
  "normalized": false,
95
  "rstrip": true,
@@ -97,7 +97,7 @@
97
  "special": true
98
  },
99
  "57529": {
100
- "content": "</s_Notify_Country>",
101
  "lstrip": true,
102
  "normalized": false,
103
  "rstrip": true,
@@ -105,7 +105,7 @@
105
  "special": true
106
  },
107
  "57530": {
108
- "content": "<s_Consignor>",
109
  "lstrip": true,
110
  "normalized": false,
111
  "rstrip": true,
@@ -113,7 +113,7 @@
113
  "special": true
114
  },
115
  "57531": {
116
- "content": "<s_Notify_Country>",
117
  "lstrip": true,
118
  "normalized": false,
119
  "rstrip": true,
@@ -121,7 +121,7 @@
121
  "special": true
122
  },
123
  "57532": {
124
- "content": "</s_Second_Notify_Country>",
125
  "lstrip": true,
126
  "normalized": false,
127
  "rstrip": true,
@@ -129,7 +129,7 @@
129
  "special": true
130
  },
131
  "57533": {
132
- "content": "</s_Consignee_Country>",
133
  "lstrip": true,
134
  "normalized": false,
135
  "rstrip": true,
@@ -137,7 +137,7 @@
137
  "special": true
138
  },
139
  "57534": {
140
- "content": "<s_Goods_Description>",
141
  "lstrip": true,
142
  "normalized": false,
143
  "rstrip": true,
@@ -145,7 +145,7 @@
145
  "special": true
146
  },
147
  "57535": {
148
- "content": "</s_Consignor_Country>",
149
  "lstrip": true,
150
  "normalized": false,
151
  "rstrip": true,
@@ -153,119 +153,7 @@
153
  "special": true
154
  },
155
  "57536": {
156
- "content": "</s_Consignee>",
157
- "lstrip": true,
158
- "normalized": false,
159
- "rstrip": true,
160
- "single_word": false,
161
- "special": true
162
- },
163
- "57537": {
164
- "content": "<s_Second_Notify_Country>",
165
- "lstrip": true,
166
- "normalized": false,
167
- "rstrip": true,
168
- "single_word": false,
169
- "special": true
170
- },
171
- "57538": {
172
- "content": "<s_Marks>",
173
- "lstrip": true,
174
- "normalized": false,
175
- "rstrip": true,
176
- "single_word": false,
177
- "special": true
178
- },
179
- "57539": {
180
- "content": "<s_Total_Weight>",
181
- "lstrip": true,
182
- "normalized": false,
183
- "rstrip": true,
184
- "single_word": false,
185
- "special": true
186
- },
187
- "57540": {
188
- "content": "</s_Notify>",
189
- "lstrip": true,
190
- "normalized": false,
191
- "rstrip": true,
192
- "single_word": false,
193
- "special": true
194
- },
195
- "57541": {
196
- "content": "</s_Goods_Description>",
197
- "lstrip": true,
198
- "normalized": false,
199
- "rstrip": true,
200
- "single_word": false,
201
- "special": true
202
- },
203
- "57542": {
204
- "content": "<s_Second_Notify>",
205
- "lstrip": true,
206
- "normalized": false,
207
- "rstrip": true,
208
- "single_word": false,
209
- "special": true
210
- },
211
- "57543": {
212
- "content": "<s_Total_Volume>",
213
- "lstrip": true,
214
- "normalized": false,
215
- "rstrip": true,
216
- "single_word": false,
217
- "special": true
218
- },
219
- "57544": {
220
- "content": "</s_Total_Weight>",
221
- "lstrip": true,
222
- "normalized": false,
223
- "rstrip": true,
224
- "single_word": false,
225
- "special": true
226
- },
227
- "57545": {
228
- "content": "<s_Consignee>",
229
- "lstrip": true,
230
- "normalized": false,
231
- "rstrip": true,
232
- "single_word": false,
233
- "special": true
234
- },
235
- "57546": {
236
- "content": "</s_Second_Notify>",
237
- "lstrip": true,
238
- "normalized": false,
239
- "rstrip": true,
240
- "single_word": false,
241
- "special": true
242
- },
243
- "57547": {
244
- "content": "</s_Total_Volume>",
245
- "lstrip": true,
246
- "normalized": false,
247
- "rstrip": true,
248
- "single_word": false,
249
- "special": true
250
- },
251
- "57548": {
252
- "content": "</s_Marks>",
253
- "lstrip": true,
254
- "normalized": false,
255
- "rstrip": true,
256
- "single_word": false,
257
- "special": true
258
- },
259
- "57549": {
260
- "content": "</s_Consignor>",
261
- "lstrip": true,
262
- "normalized": false,
263
- "rstrip": true,
264
- "single_word": false,
265
- "special": true
266
- },
267
- "57550": {
268
- "content": "</s_Total_Packages>",
269
  "lstrip": true,
270
  "normalized": false,
271
  "rstrip": true,
@@ -274,57 +162,33 @@
274
  }
275
  },
276
  "additional_special_tokens": [
277
- "<s>",
278
- "<pad>",
279
- "</s>",
280
- "<unk>",
281
- "<mask>",
282
  "<s_iitcdip>",
283
  "<s_synthdog>",
284
- "<s_Notify>",
285
- "<s_Total_Packages>",
286
- "<s_Consignor_Country>",
287
- "<s_Consignee_Country>",
288
- "</s_Notify_Country>",
289
- "<s_Consignor>",
290
- "<s_Notify_Country>",
291
- "</s_Second_Notify_Country>",
292
- "</s_Consignee_Country>",
293
- "<s_Goods_Description>",
294
- "</s_Consignor_Country>",
295
- "</s_Consignee>",
296
- "<s_Second_Notify_Country>",
297
- "<s_Marks>",
298
- "<s_Total_Weight>",
299
- "</s_Notify>",
300
- "</s_Goods_Description>",
301
- "<s_Second_Notify>",
302
- "<s_Total_Volume>",
303
- "</s_Total_Weight>",
304
- "<s_Consignee>",
305
- "</s_Second_Notify>",
306
- "</s_Total_Volume>",
307
- "</s_Marks>",
308
- "</s_Consignor>",
309
- "</s_Total_Packages>"
310
  ],
311
  "bos_token": "<s>",
312
  "clean_up_tokenization_spaces": true,
313
  "cls_token": "<s>",
314
  "eos_token": "</s>",
315
  "mask_token": "<mask>",
316
- "max_length": 512,
317
  "model_max_length": 1000000000000000019884624838656,
318
- "pad_to_multiple_of": null,
319
  "pad_token": "<pad>",
320
- "pad_token_type_id": 0,
321
- "padding_side": "right",
322
  "processor_class": "DonutProcessor",
323
  "sep_token": "</s>",
324
  "sp_model_kwargs": {},
325
- "stride": 0,
326
  "tokenizer_class": "XLMRobertaTokenizer",
327
- "truncation_side": "right",
328
- "truncation_strategy": "longest_first",
329
  "unk_token": "<unk>"
330
  }
 
2
  "added_tokens_decoder": {
3
  "0": {
4
  "content": "<s>",
5
+ "lstrip": true,
6
  "normalized": false,
7
+ "rstrip": true,
8
  "single_word": false,
9
  "special": true
10
  },
 
18
  },
19
  "2": {
20
  "content": "</s>",
21
+ "lstrip": true,
22
  "normalized": false,
23
+ "rstrip": true,
24
  "single_word": false,
25
  "special": true
26
  },
 
35
  "57521": {
36
  "content": "<mask>",
37
  "lstrip": true,
38
+ "normalized": true,
39
  "rstrip": false,
40
  "single_word": false,
41
  "special": true
 
65
  "special": true
66
  },
67
  "57525": {
68
+ "content": "<s_Posizioni>",
69
  "lstrip": true,
70
  "normalized": false,
71
  "rstrip": true,
 
73
  "special": true
74
  },
75
  "57526": {
76
+ "content": "<s_Data>",
77
  "lstrip": true,
78
  "normalized": false,
79
  "rstrip": true,
 
81
  "special": true
82
  },
83
  "57527": {
84
+ "content": "<s_Codici>",
85
  "lstrip": true,
86
  "normalized": false,
87
  "rstrip": true,
 
89
  "special": true
90
  },
91
  "57528": {
92
+ "content": "</s_Quantita>",
93
  "lstrip": true,
94
  "normalized": false,
95
  "rstrip": true,
 
97
  "special": true
98
  },
99
  "57529": {
100
+ "content": "</s_Numero>",
101
  "lstrip": true,
102
  "normalized": false,
103
  "rstrip": true,
 
105
  "special": true
106
  },
107
  "57530": {
108
+ "content": "</s_Posizioni>",
109
  "lstrip": true,
110
  "normalized": false,
111
  "rstrip": true,
 
113
  "special": true
114
  },
115
  "57531": {
116
+ "content": "</s_Codici>",
117
  "lstrip": true,
118
  "normalized": false,
119
  "rstrip": true,
 
121
  "special": true
122
  },
123
  "57532": {
124
+ "content": "<s_Quantita>",
125
  "lstrip": true,
126
  "normalized": false,
127
  "rstrip": true,
 
129
  "special": true
130
  },
131
  "57533": {
132
+ "content": "</s_Fornitore>",
133
  "lstrip": true,
134
  "normalized": false,
135
  "rstrip": true,
 
137
  "special": true
138
  },
139
  "57534": {
140
+ "content": "<s_Numero>",
141
  "lstrip": true,
142
  "normalized": false,
143
  "rstrip": true,
 
145
  "special": true
146
  },
147
  "57535": {
148
+ "content": "<s_Fornitore>",
149
  "lstrip": true,
150
  "normalized": false,
151
  "rstrip": true,
 
153
  "special": true
154
  },
155
  "57536": {
156
+ "content": "</s_Data>",
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
157
  "lstrip": true,
158
  "normalized": false,
159
  "rstrip": true,
 
162
  }
163
  },
164
  "additional_special_tokens": [
 
 
 
 
 
165
  "<s_iitcdip>",
166
  "<s_synthdog>",
167
+ "<s_Posizioni>",
168
+ "<s_Data>",
169
+ "<s_Codici>",
170
+ "</s>",
171
+ "</s_Quantita>",
172
+ "</s_Numero>",
173
+ "</s_Posizioni>",
174
+ "</s_Codici>",
175
+ "<s_Quantita>",
176
+ "</s_Fornitore>",
177
+ "<s_Numero>",
178
+ "<s_Fornitore>",
179
+ "<s>",
180
+ "</s_Data>"
 
 
 
 
 
 
 
 
 
 
 
 
181
  ],
182
  "bos_token": "<s>",
183
  "clean_up_tokenization_spaces": true,
184
  "cls_token": "<s>",
185
  "eos_token": "</s>",
186
  "mask_token": "<mask>",
 
187
  "model_max_length": 1000000000000000019884624838656,
 
188
  "pad_token": "<pad>",
 
 
189
  "processor_class": "DonutProcessor",
190
  "sep_token": "</s>",
191
  "sp_model_kwargs": {},
 
192
  "tokenizer_class": "XLMRobertaTokenizer",
 
 
193
  "unk_token": "<unk>"
194
  }
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:1c5d2c1f955567456d8485e5d41d98208e55524d44111b76444f3a7eead18c68
3
  size 4664
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2ed308013c1c7b71d331e7af16d7ef386cd223ba7455751efed12a5f11afd8a5
3
  size 4664