dodogeny committed on
Commit
f0c0fb0
1 Parent(s): 80856eb

End of training

Browse files
README.md CHANGED
@@ -40,7 +40,6 @@ The following hyperparameters were used during training:
40
  - optimizer: Adam with betas=(0.9,0.999) and epsilon=1e-08
41
  - lr_scheduler_type: linear
42
  - num_epochs: 3
43
- - mixed_precision_training: Native AMP
44
 
45
  ### Training results
46
 
@@ -48,7 +47,7 @@ The following hyperparameters were used during training:
48
 
49
  ### Framework versions
50
 
51
- - Transformers 4.23.1
52
- - Pytorch 1.12.1+cu113
53
- - Datasets 2.6.1
54
- - Tokenizers 0.13.1
 
40
  - optimizer: Adam with betas=(0.9,0.999) and epsilon=1e-08
41
  - lr_scheduler_type: linear
42
  - num_epochs: 3
 
43
 
44
  ### Training results
45
 
 
47
 
48
  ### Framework versions
49
 
50
+ - Transformers 4.26.0.dev0
51
+ - Pytorch 1.13.0+cu116
52
+ - Datasets 2.8.0
53
+ - Tokenizers 0.13.2
added_tokens.json CHANGED
@@ -1,19 +1,25 @@
1
  {
2
- "</s_address>": 57585,
 
3
  "</s_cashprice>": 57549,
 
4
  "</s_changeprice>": 57551,
5
  "</s_cnt>": 57529,
6
- "</s_company>": 57583,
7
  "</s_creditcardprice>": 57563,
8
- "</s_date>": 57581,
9
  "</s_discount_price>": 57557,
10
  "</s_discountprice>": 57567,
 
11
  "</s_emoneyprice>": 57569,
12
  "</s_etc>": 57541,
 
13
  "</s_itemsubtotal>": 57577,
 
14
  "</s_menu>": 57525,
15
  "</s_menuqty_cnt>": 57555,
16
  "</s_menutype_cnt>": 57553,
 
17
  "</s_nm>": 57527,
18
  "</s_num>": 57565,
19
  "</s_othersvc_price>": 57573,
@@ -23,29 +29,36 @@
23
  "</s_sub_total>": 57533,
24
  "</s_subtotal_price>": 57535,
25
  "</s_tax_price>": 57539,
 
26
  "</s_total>": 57543,
27
  "</s_total_etc>": 57561,
28
  "</s_total_price>": 57545,
29
  "</s_unitprice>": 57559,
30
  "</s_vatyn>": 57575,
31
  "</s_void_menu>": 57571,
32
- "<s_address>": 57584,
 
33
  "<s_cashprice>": 57550,
 
34
  "<s_changeprice>": 57552,
35
  "<s_cnt>": 57530,
36
- "<s_company>": 57582,
37
  "<s_cord-v2>": 57579,
38
  "<s_creditcardprice>": 57564,
39
- "<s_date>": 57580,
40
  "<s_discount_price>": 57558,
41
  "<s_discountprice>": 57568,
 
42
  "<s_emoneyprice>": 57570,
43
  "<s_etc>": 57542,
 
44
  "<s_iitcdip>": 57523,
45
  "<s_itemsubtotal>": 57578,
 
46
  "<s_menu>": 57526,
47
  "<s_menuqty_cnt>": 57556,
48
  "<s_menutype_cnt>": 57554,
 
49
  "<s_nm>": 57528,
50
  "<s_num>": 57566,
51
  "<s_othersvc_price>": 57574,
@@ -56,6 +69,7 @@
56
  "<s_subtotal_price>": 57536,
57
  "<s_synthdog>": 57524,
58
  "<s_tax_price>": 57540,
 
59
  "<s_total>": 57544,
60
  "<s_total_etc>": 57562,
61
  "<s_total_price>": 57546,
 
1
  {
2
+ "</s_address>": 57599,
3
+ "</s_cash>": 57583,
4
  "</s_cashprice>": 57549,
5
+ "</s_change>": 57581,
6
  "</s_changeprice>": 57551,
7
  "</s_cnt>": 57529,
8
+ "</s_company>": 57597,
9
  "</s_creditcardprice>": 57563,
10
+ "</s_date>": 57595,
11
  "</s_discount_price>": 57557,
12
  "</s_discountprice>": 57567,
13
+ "</s_email>": 57593,
14
  "</s_emoneyprice>": 57569,
15
  "</s_etc>": 57541,
16
+ "</s_fax>": 57591,
17
  "</s_itemsubtotal>": 57577,
18
+ "</s_lineNumber>": 57589,
19
  "</s_menu>": 57525,
20
  "</s_menuqty_cnt>": 57555,
21
  "</s_menutype_cnt>": 57553,
22
+ "</s_merchant>": 57587,
23
  "</s_nm>": 57527,
24
  "</s_num>": 57565,
25
  "</s_othersvc_price>": 57573,
 
29
  "</s_sub_total>": 57533,
30
  "</s_subtotal_price>": 57535,
31
  "</s_tax_price>": 57539,
32
+ "</s_tel>": 57585,
33
  "</s_total>": 57543,
34
  "</s_total_etc>": 57561,
35
  "</s_total_price>": 57545,
36
  "</s_unitprice>": 57559,
37
  "</s_vatyn>": 57575,
38
  "</s_void_menu>": 57571,
39
+ "<s_address>": 57598,
40
+ "<s_cash>": 57582,
41
  "<s_cashprice>": 57550,
42
+ "<s_change>": 57580,
43
  "<s_changeprice>": 57552,
44
  "<s_cnt>": 57530,
45
+ "<s_company>": 57596,
46
  "<s_cord-v2>": 57579,
47
  "<s_creditcardprice>": 57564,
48
+ "<s_date>": 57594,
49
  "<s_discount_price>": 57558,
50
  "<s_discountprice>": 57568,
51
+ "<s_email>": 57592,
52
  "<s_emoneyprice>": 57570,
53
  "<s_etc>": 57542,
54
+ "<s_fax>": 57590,
55
  "<s_iitcdip>": 57523,
56
  "<s_itemsubtotal>": 57578,
57
+ "<s_lineNumber>": 57588,
58
  "<s_menu>": 57526,
59
  "<s_menuqty_cnt>": 57556,
60
  "<s_menutype_cnt>": 57554,
61
+ "<s_merchant>": 57586,
62
  "<s_nm>": 57528,
63
  "<s_num>": 57566,
64
  "<s_othersvc_price>": 57574,
 
69
  "<s_subtotal_price>": 57536,
70
  "<s_synthdog>": 57524,
71
  "<s_tax_price>": 57540,
72
+ "<s_tel>": 57584,
73
  "<s_total>": 57544,
74
  "<s_total_etc>": 57562,
75
  "<s_total_price>": 57546,
preprocessor_config.json CHANGED
@@ -2,14 +2,15 @@
2
  "do_align_long_axis": false,
3
  "do_normalize": true,
4
  "do_pad": true,
 
5
  "do_resize": true,
6
  "do_thumbnail": true,
7
- "feature_extractor_type": "DonutFeatureExtractor",
8
  "image_mean": [
9
  0.5,
10
  0.5,
11
  0.5
12
  ],
 
13
  "image_std": [
14
  0.5,
15
  0.5,
@@ -17,6 +18,7 @@
17
  ],
18
  "processor_class": "DonutProcessor",
19
  "resample": 2,
 
20
  "size": [
21
  720,
22
  960
 
2
  "do_align_long_axis": false,
3
  "do_normalize": true,
4
  "do_pad": true,
5
+ "do_rescale": true,
6
  "do_resize": true,
7
  "do_thumbnail": true,
 
8
  "image_mean": [
9
  0.5,
10
  0.5,
11
  0.5
12
  ],
13
+ "image_processor_type": "DonutImageProcessor",
14
  "image_std": [
15
  0.5,
16
  0.5,
 
18
  ],
19
  "processor_class": "DonutProcessor",
20
  "resample": 2,
21
+ "rescale_factor": 0.00392156862745098,
22
  "size": [
23
  720,
24
  960
pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:f968e50c4d6d10032f1dbb4ab8d224a298e5049ba06790ed65220ba9ecfbf69c
3
  size 806333657
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:eeff45a90481fda3e2dea66c3fb498065486beb524d2ddd3ec39f71e1320a429
3
  size 806333657
runs/Jan02_17-53-43_0c15e67d1a0b/events.out.tfevents.1672682410.0c15e67d1a0b.879.0 CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:23ae97becf7788d35209fe081fa91c7436d576d6428e92a73c79e8ae86f65e11
3
- size 8710
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:102af906ba35c84847edbc5f0dcfe93f472980170de53f4f9d23e70aaec065ec
3
+ size 10006
special_tokens_map.json CHANGED
@@ -4,24 +4,38 @@
4
  "</s_total>",
5
  "<s_total_price>",
6
  "</s_total_price>",
7
- "<s_changeprice>",
8
- "</s_changeprice>",
9
- "<s_cashprice>",
10
- "</s_cashprice>",
 
 
 
 
11
  "<s_sub_total>",
12
  "</s_sub_total>",
13
- "<s_subtotal_price>",
14
- "</s_subtotal_price>",
 
 
 
 
 
 
 
 
15
  "<s_menu>",
16
  "</s_menu>",
17
- "<s_unitprice>",
18
- "</s_unitprice>",
19
- "<s_price>",
20
- "</s_price>",
21
  "<s_nm>",
22
  "</s_nm>",
 
 
23
  "<s_cnt>",
24
  "</s_cnt>",
 
 
 
 
25
  "<s_date>",
26
  "</s_date>",
27
  "<s_company>",
 
4
  "</s_total>",
5
  "<s_total_price>",
6
  "</s_total_price>",
7
+ "<s_price>",
8
+ "</s_price>",
9
+ "<s_change>",
10
+ "</s_change>",
11
+ "<s_cash>",
12
+ "</s_cash>",
13
+ "<s_tel>",
14
+ "</s_tel>",
15
  "<s_sub_total>",
16
  "</s_sub_total>",
17
+ "<s_tax_price>",
18
+ "</s_tax_price>",
19
+ "<s_service_price>",
20
+ "</s_service_price>",
21
+ "<s_etc>",
22
+ "</s_etc>",
23
+ "<s_discount_price>",
24
+ "</s_discount_price>",
25
+ "<s_merchant>",
26
+ "</s_merchant>",
27
  "<s_menu>",
28
  "</s_menu>",
 
 
 
 
29
  "<s_nm>",
30
  "</s_nm>",
31
+ "<s_lineNumber>",
32
+ "</s_lineNumber>",
33
  "<s_cnt>",
34
  "</s_cnt>",
35
+ "<s_fax>",
36
+ "</s_fax>",
37
+ "<s_email>",
38
+ "</s_email>",
39
  "<s_date>",
40
  "</s_date>",
41
  "<s_company>",
tokenizer.json CHANGED
@@ -185,8 +185,8 @@
185
  "single_word": false,
186
  "lstrip": false,
187
  "rstrip": false,
188
- "normalized": false,
189
- "special": true
190
  },
191
  {
192
  "id": 57536,
@@ -194,8 +194,8 @@
194
  "single_word": false,
195
  "lstrip": false,
196
  "rstrip": false,
197
- "normalized": false,
198
- "special": true
199
  },
200
  {
201
  "id": 57537,
@@ -203,8 +203,8 @@
203
  "single_word": false,
204
  "lstrip": false,
205
  "rstrip": false,
206
- "normalized": true,
207
- "special": false
208
  },
209
  {
210
  "id": 57538,
@@ -212,8 +212,8 @@
212
  "single_word": false,
213
  "lstrip": false,
214
  "rstrip": false,
215
- "normalized": true,
216
- "special": false
217
  },
218
  {
219
  "id": 57539,
@@ -221,8 +221,8 @@
221
  "single_word": false,
222
  "lstrip": false,
223
  "rstrip": false,
224
- "normalized": true,
225
- "special": false
226
  },
227
  {
228
  "id": 57540,
@@ -230,8 +230,8 @@
230
  "single_word": false,
231
  "lstrip": false,
232
  "rstrip": false,
233
- "normalized": true,
234
- "special": false
235
  },
236
  {
237
  "id": 57541,
@@ -239,8 +239,8 @@
239
  "single_word": false,
240
  "lstrip": false,
241
  "rstrip": false,
242
- "normalized": true,
243
- "special": false
244
  },
245
  {
246
  "id": 57542,
@@ -248,8 +248,8 @@
248
  "single_word": false,
249
  "lstrip": false,
250
  "rstrip": false,
251
- "normalized": true,
252
- "special": false
253
  },
254
  {
255
  "id": 57543,
@@ -311,8 +311,8 @@
311
  "single_word": false,
312
  "lstrip": false,
313
  "rstrip": false,
314
- "normalized": false,
315
- "special": true
316
  },
317
  {
318
  "id": 57550,
@@ -320,8 +320,8 @@
320
  "single_word": false,
321
  "lstrip": false,
322
  "rstrip": false,
323
- "normalized": false,
324
- "special": true
325
  },
326
  {
327
  "id": 57551,
@@ -329,8 +329,8 @@
329
  "single_word": false,
330
  "lstrip": false,
331
  "rstrip": false,
332
- "normalized": false,
333
- "special": true
334
  },
335
  {
336
  "id": 57552,
@@ -338,8 +338,8 @@
338
  "single_word": false,
339
  "lstrip": false,
340
  "rstrip": false,
341
- "normalized": false,
342
- "special": true
343
  },
344
  {
345
  "id": 57553,
@@ -383,8 +383,8 @@
383
  "single_word": false,
384
  "lstrip": false,
385
  "rstrip": false,
386
- "normalized": true,
387
- "special": false
388
  },
389
  {
390
  "id": 57558,
@@ -392,8 +392,8 @@
392
  "single_word": false,
393
  "lstrip": false,
394
  "rstrip": false,
395
- "normalized": true,
396
- "special": false
397
  },
398
  {
399
  "id": 57559,
@@ -401,8 +401,8 @@
401
  "single_word": false,
402
  "lstrip": false,
403
  "rstrip": false,
404
- "normalized": false,
405
- "special": true
406
  },
407
  {
408
  "id": 57560,
@@ -410,8 +410,8 @@
410
  "single_word": false,
411
  "lstrip": false,
412
  "rstrip": false,
413
- "normalized": false,
414
- "special": true
415
  },
416
  {
417
  "id": 57561,
@@ -586,7 +586,7 @@
586
  },
587
  {
588
  "id": 57580,
589
- "content": "<s_date>",
590
  "single_word": false,
591
  "lstrip": false,
592
  "rstrip": false,
@@ -595,7 +595,7 @@
595
  },
596
  {
597
  "id": 57581,
598
- "content": "</s_date>",
599
  "single_word": false,
600
  "lstrip": false,
601
  "rstrip": false,
@@ -604,7 +604,7 @@
604
  },
605
  {
606
  "id": 57582,
607
- "content": "<s_company>",
608
  "single_word": false,
609
  "lstrip": false,
610
  "rstrip": false,
@@ -613,7 +613,7 @@
613
  },
614
  {
615
  "id": 57583,
616
- "content": "</s_company>",
617
  "single_word": false,
618
  "lstrip": false,
619
  "rstrip": false,
@@ -622,7 +622,7 @@
622
  },
623
  {
624
  "id": 57584,
625
- "content": "<s_address>",
626
  "single_word": false,
627
  "lstrip": false,
628
  "rstrip": false,
@@ -631,6 +631,132 @@
631
  },
632
  {
633
  "id": 57585,
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
634
  "content": "</s_address>",
635
  "single_word": false,
636
  "lstrip": false,
 
185
  "single_word": false,
186
  "lstrip": false,
187
  "rstrip": false,
188
+ "normalized": true,
189
+ "special": false
190
  },
191
  {
192
  "id": 57536,
 
194
  "single_word": false,
195
  "lstrip": false,
196
  "rstrip": false,
197
+ "normalized": true,
198
+ "special": false
199
  },
200
  {
201
  "id": 57537,
 
203
  "single_word": false,
204
  "lstrip": false,
205
  "rstrip": false,
206
+ "normalized": false,
207
+ "special": true
208
  },
209
  {
210
  "id": 57538,
 
212
  "single_word": false,
213
  "lstrip": false,
214
  "rstrip": false,
215
+ "normalized": false,
216
+ "special": true
217
  },
218
  {
219
  "id": 57539,
 
221
  "single_word": false,
222
  "lstrip": false,
223
  "rstrip": false,
224
+ "normalized": false,
225
+ "special": true
226
  },
227
  {
228
  "id": 57540,
 
230
  "single_word": false,
231
  "lstrip": false,
232
  "rstrip": false,
233
+ "normalized": false,
234
+ "special": true
235
  },
236
  {
237
  "id": 57541,
 
239
  "single_word": false,
240
  "lstrip": false,
241
  "rstrip": false,
242
+ "normalized": false,
243
+ "special": true
244
  },
245
  {
246
  "id": 57542,
 
248
  "single_word": false,
249
  "lstrip": false,
250
  "rstrip": false,
251
+ "normalized": false,
252
+ "special": true
253
  },
254
  {
255
  "id": 57543,
 
311
  "single_word": false,
312
  "lstrip": false,
313
  "rstrip": false,
314
+ "normalized": true,
315
+ "special": false
316
  },
317
  {
318
  "id": 57550,
 
320
  "single_word": false,
321
  "lstrip": false,
322
  "rstrip": false,
323
+ "normalized": true,
324
+ "special": false
325
  },
326
  {
327
  "id": 57551,
 
329
  "single_word": false,
330
  "lstrip": false,
331
  "rstrip": false,
332
+ "normalized": true,
333
+ "special": false
334
  },
335
  {
336
  "id": 57552,
 
338
  "single_word": false,
339
  "lstrip": false,
340
  "rstrip": false,
341
+ "normalized": true,
342
+ "special": false
343
  },
344
  {
345
  "id": 57553,
 
383
  "single_word": false,
384
  "lstrip": false,
385
  "rstrip": false,
386
+ "normalized": false,
387
+ "special": true
388
  },
389
  {
390
  "id": 57558,
 
392
  "single_word": false,
393
  "lstrip": false,
394
  "rstrip": false,
395
+ "normalized": false,
396
+ "special": true
397
  },
398
  {
399
  "id": 57559,
 
401
  "single_word": false,
402
  "lstrip": false,
403
  "rstrip": false,
404
+ "normalized": true,
405
+ "special": false
406
  },
407
  {
408
  "id": 57560,
 
410
  "single_word": false,
411
  "lstrip": false,
412
  "rstrip": false,
413
+ "normalized": true,
414
+ "special": false
415
  },
416
  {
417
  "id": 57561,
 
586
  },
587
  {
588
  "id": 57580,
589
+ "content": "<s_change>",
590
  "single_word": false,
591
  "lstrip": false,
592
  "rstrip": false,
 
595
  },
596
  {
597
  "id": 57581,
598
+ "content": "</s_change>",
599
  "single_word": false,
600
  "lstrip": false,
601
  "rstrip": false,
 
604
  },
605
  {
606
  "id": 57582,
607
+ "content": "<s_cash>",
608
  "single_word": false,
609
  "lstrip": false,
610
  "rstrip": false,
 
613
  },
614
  {
615
  "id": 57583,
616
+ "content": "</s_cash>",
617
  "single_word": false,
618
  "lstrip": false,
619
  "rstrip": false,
 
622
  },
623
  {
624
  "id": 57584,
625
+ "content": "<s_tel>",
626
  "single_word": false,
627
  "lstrip": false,
628
  "rstrip": false,
 
631
  },
632
  {
633
  "id": 57585,
634
+ "content": "</s_tel>",
635
+ "single_word": false,
636
+ "lstrip": false,
637
+ "rstrip": false,
638
+ "normalized": false,
639
+ "special": true
640
+ },
641
+ {
642
+ "id": 57586,
643
+ "content": "<s_merchant>",
644
+ "single_word": false,
645
+ "lstrip": false,
646
+ "rstrip": false,
647
+ "normalized": false,
648
+ "special": true
649
+ },
650
+ {
651
+ "id": 57587,
652
+ "content": "</s_merchant>",
653
+ "single_word": false,
654
+ "lstrip": false,
655
+ "rstrip": false,
656
+ "normalized": false,
657
+ "special": true
658
+ },
659
+ {
660
+ "id": 57588,
661
+ "content": "<s_lineNumber>",
662
+ "single_word": false,
663
+ "lstrip": false,
664
+ "rstrip": false,
665
+ "normalized": false,
666
+ "special": true
667
+ },
668
+ {
669
+ "id": 57589,
670
+ "content": "</s_lineNumber>",
671
+ "single_word": false,
672
+ "lstrip": false,
673
+ "rstrip": false,
674
+ "normalized": false,
675
+ "special": true
676
+ },
677
+ {
678
+ "id": 57590,
679
+ "content": "<s_fax>",
680
+ "single_word": false,
681
+ "lstrip": false,
682
+ "rstrip": false,
683
+ "normalized": false,
684
+ "special": true
685
+ },
686
+ {
687
+ "id": 57591,
688
+ "content": "</s_fax>",
689
+ "single_word": false,
690
+ "lstrip": false,
691
+ "rstrip": false,
692
+ "normalized": false,
693
+ "special": true
694
+ },
695
+ {
696
+ "id": 57592,
697
+ "content": "<s_email>",
698
+ "single_word": false,
699
+ "lstrip": false,
700
+ "rstrip": false,
701
+ "normalized": false,
702
+ "special": true
703
+ },
704
+ {
705
+ "id": 57593,
706
+ "content": "</s_email>",
707
+ "single_word": false,
708
+ "lstrip": false,
709
+ "rstrip": false,
710
+ "normalized": false,
711
+ "special": true
712
+ },
713
+ {
714
+ "id": 57594,
715
+ "content": "<s_date>",
716
+ "single_word": false,
717
+ "lstrip": false,
718
+ "rstrip": false,
719
+ "normalized": false,
720
+ "special": true
721
+ },
722
+ {
723
+ "id": 57595,
724
+ "content": "</s_date>",
725
+ "single_word": false,
726
+ "lstrip": false,
727
+ "rstrip": false,
728
+ "normalized": false,
729
+ "special": true
730
+ },
731
+ {
732
+ "id": 57596,
733
+ "content": "<s_company>",
734
+ "single_word": false,
735
+ "lstrip": false,
736
+ "rstrip": false,
737
+ "normalized": false,
738
+ "special": true
739
+ },
740
+ {
741
+ "id": 57597,
742
+ "content": "</s_company>",
743
+ "single_word": false,
744
+ "lstrip": false,
745
+ "rstrip": false,
746
+ "normalized": false,
747
+ "special": true
748
+ },
749
+ {
750
+ "id": 57598,
751
+ "content": "<s_address>",
752
+ "single_word": false,
753
+ "lstrip": false,
754
+ "rstrip": false,
755
+ "normalized": false,
756
+ "special": true
757
+ },
758
+ {
759
+ "id": 57599,
760
  "content": "</s_address>",
761
  "single_word": false,
762
  "lstrip": false,
tokenizer_config.json CHANGED
@@ -10,6 +10,7 @@
10
  "rstrip": false,
11
  "single_word": false
12
  },
 
13
  "name_or_path": "naver-clova-ix/donut-base-finetuned-cord-v2",
14
  "pad_token": "<pad>",
15
  "processor_class": "DonutProcessor",
 
10
  "rstrip": false,
11
  "single_word": false
12
  },
13
+ "model_max_length": 1000000000000000019884624838656,
14
  "name_or_path": "naver-clova-ix/donut-base-finetuned-cord-v2",
15
  "pad_token": "<pad>",
16
  "processor_class": "DonutProcessor",