eyeonyou committed on
Commit
39689c3
1 Parent(s): e9b7ace

Training in progress, epoch 1

Browse files
Files changed (28) hide show
  1. config.json +14 -58
  2. merges.txt +0 -0
  3. model.safetensors +2 -2
  4. runs/Apr25_11-02-50_1f13d83ecfdd/events.out.tfevents.1714042971.1f13d83ecfdd.9137.0 +3 -0
  5. runs/Apr25_11-04-32_1f13d83ecfdd/events.out.tfevents.1714043073.1f13d83ecfdd.9137.1 +3 -0
  6. runs/Apr25_11-04-42_1f13d83ecfdd/events.out.tfevents.1714043082.1f13d83ecfdd.9137.2 +3 -0
  7. runs/Apr25_11-04-49_1f13d83ecfdd/events.out.tfevents.1714043090.1f13d83ecfdd.9137.3 +3 -0
  8. runs/Apr25_11-04-56_1f13d83ecfdd/events.out.tfevents.1714043097.1f13d83ecfdd.9137.4 +3 -0
  9. runs/Apr25_11-05-22_1f13d83ecfdd/events.out.tfevents.1714043123.1f13d83ecfdd.9137.5 +3 -0
  10. runs/Apr25_11-31-05_1f13d83ecfdd/events.out.tfevents.1714044666.1f13d83ecfdd.9137.6 +3 -0
  11. runs/Apr25_11-41-37_1f13d83ecfdd/events.out.tfevents.1714045298.1f13d83ecfdd.9137.7 +3 -0
  12. runs/Apr25_11-43-50_1f13d83ecfdd/events.out.tfevents.1714045430.1f13d83ecfdd.9137.8 +3 -0
  13. runs/Apr25_11-44-07_1f13d83ecfdd/events.out.tfevents.1714045448.1f13d83ecfdd.9137.9 +3 -0
  14. runs/Apr25_11-50-56_1f13d83ecfdd/events.out.tfevents.1714045856.1f13d83ecfdd.9137.10 +3 -0
  15. runs/Apr25_12-08-46_1f13d83ecfdd/events.out.tfevents.1714046927.1f13d83ecfdd.9137.11 +3 -0
  16. runs/Apr25_12-09-14_1f13d83ecfdd/events.out.tfevents.1714046955.1f13d83ecfdd.9137.12 +3 -0
  17. runs/Apr25_12-09-37_1f13d83ecfdd/events.out.tfevents.1714046977.1f13d83ecfdd.9137.13 +3 -0
  18. runs/Apr25_12-10-39_1f13d83ecfdd/events.out.tfevents.1714047040.1f13d83ecfdd.9137.14 +3 -0
  19. runs/Apr25_12-12-57_1f13d83ecfdd/events.out.tfevents.1714047177.1f13d83ecfdd.9137.15 +3 -0
  20. runs/Apr25_12-14-17_1f13d83ecfdd/events.out.tfevents.1714047257.1f13d83ecfdd.9137.16 +3 -0
  21. runs/Apr25_12-15-59_1f13d83ecfdd/events.out.tfevents.1714047359.1f13d83ecfdd.9137.17 +3 -0
  22. runs/Apr25_12-19-01_1f13d83ecfdd/events.out.tfevents.1714047541.1f13d83ecfdd.9137.18 +3 -0
  23. runs/Apr25_12-24-12_1f13d83ecfdd/events.out.tfevents.1714047852.1f13d83ecfdd.9137.19 +3 -0
  24. runs/Apr25_12-25-30_1f13d83ecfdd/events.out.tfevents.1714047931.1f13d83ecfdd.9137.20 +3 -0
  25. tokenizer.json +0 -0
  26. tokenizer_config.json +4 -4
  27. training_args.bin +2 -2
  28. vocab.json +0 -0
config.json CHANGED
@@ -1,82 +1,38 @@
1
  {
2
- "_name_or_path": "ai-forever/ruRoberta-large",
3
  "architectures": [
4
  "RobertaForSequenceClassification"
5
  ],
6
  "attention_probs_dropout_prob": 0.1,
7
- "bos_token_id": 1,
8
  "classifier_dropout": null,
9
  "eos_token_id": 2,
10
- "gradient_checkpointing": false,
11
  "hidden_act": "gelu",
12
  "hidden_dropout_prob": 0.1,
13
- "hidden_size": 1024,
14
  "id2label": {
15
- "0": "\u041f\u0440\u0438\u043a\u043b\u0430\u0434\u043d\u0430\u044f \u043c\u0430\u0442\u0435\u043c\u0430\u0442\u0438\u043a\u0430 \u0438 \u0438\u043d\u0444\u043e\u0440\u043c\u0430\u0442\u0438\u043a\u0430",
16
- "1": "\u0418\u043d\u0444\u043e\u0440\u043c\u0430\u0442\u0438\u043a\u0430 \u0438 \u0432\u044b\u0447\u0438\u0441\u043b\u0438\u0442\u0435\u043b\u044c\u043d\u0430\u044f \u0442\u0435\u0445\u043d\u0438\u043a\u0430. \u0418\u0441\u043a\u0443\u0441\u0441\u0442\u0432\u0435\u043d\u043d\u044b\u0439 \u0438\u043d\u0442\u0435\u043b\u043b\u0435\u043a\u0442",
17
- "2": "\u0418\u043d\u0444\u043e\u0440\u043c\u0430\u0442\u0438\u043a\u0430 \u0438 \u0432\u044b\u0447\u0438\u0441\u043b\u0438\u0442\u0435\u043b\u044c\u043d\u0430\u044f \u0442\u0435\u0445\u043d\u0438\u043a\u0430. \u041a\u043e\u043c\u043f\u044c\u044e\u0442\u0435\u0440\u043d\u043e\u0435 \u043c\u043e\u0434\u0435\u043b\u0438\u0440\u043e\u0432\u0430\u043d\u0438\u0435 \u0438 \u043f\u0440\u043e\u0435\u043a\u0442\u0438\u0440\u043e\u0432\u0430\u043d\u0438\u0435",
18
- "3": "\u0418\u043d\u0444\u043e\u0440\u043c\u0430\u0446\u0438\u043e\u043d\u043d\u044b\u0435 \u0441\u0438\u0441\u0442\u0435\u043c\u044b \u0438 \u0442\u0435\u0445\u043d\u043e\u043b\u043e\u0433\u0438\u0438",
19
- "4": "\u041f\u0440\u043e\u0433\u0440\u0430\u043c\u043c\u043d\u0430\u044f \u0438\u043d\u0436\u0435\u043d\u0435\u0440\u0438\u044f",
20
- "5": "\u041a\u043e\u043c\u043f\u044c\u044e\u0442\u0435\u0440\u043d\u0430\u044f \u0431\u0435\u0437\u043e\u043f\u0430\u0441\u043d\u043e\u0441\u0442\u044c",
21
- "6": "\u0420\u0430\u0434\u0438\u043e\u0442\u0435\u0445\u043d\u0438\u043a\u0430. \u0421\u0438\u0441\u0442\u0435\u043c\u044b \u043a\u043e\u043c\u043f\u044c\u044e\u0442\u0435\u0440\u043d\u043e\u0433\u043e \u0437\u0440\u0435\u043d\u0438\u044f",
22
- "7": "\u0420\u0430\u0434\u0438\u043e\u0442\u0435\u0445\u043d\u0438\u043a\u0430. \u0426\u0438\u0444\u0440\u043e\u0432\u044b\u0435 \u0441\u0438\u0441\u0442\u0435\u043c\u044b \u043b\u043e\u043a\u0430\u0446\u0438\u0438, \u0441\u0432\u044f\u0437\u0438 \u0438 \u043d\u0430\u0432\u0438\u0433\u0430\u0446\u0438\u0438",
23
- "8": "\u0418\u043d\u0444\u043e\u043a\u043e\u043c\u043c\u0443\u043d\u0438\u043a\u0430\u0446\u0438\u043e\u043d\u043d\u044b\u0435 \u0442\u0435\u0445\u043d\u043e\u043b\u043e\u0433\u0438\u0438 \u0438 \u0441\u0438\u0441\u0442\u0435\u043c\u044b \u0441\u0432\u044f\u0437\u0438",
24
- "9": "\u041a\u043e\u043d\u0441\u0442\u0440\u0443\u0438\u0440\u043e\u0432\u0430\u043d\u0438\u0435 \u0438 \u0442\u0435\u0445\u043d\u043e\u043b\u043e\u0433\u0438\u044f \u044d\u043b\u0435\u043a\u0442\u0440\u043e\u043d\u043d\u044b\u0445 \u0441\u0440\u0435\u0434\u0441\u0442\u0432",
25
- "10": "\u042d\u043b\u0435\u043a\u0442\u0440\u043e\u043d\u0438\u043a\u0430 \u0438 \u043d\u0430\u043d\u043e\u044d\u043b\u0435\u043a\u0442\u0440\u043e\u043d\u0438\u043a\u0430",
26
- "11": "\u0420\u0430\u0434\u0438\u043e\u044d\u043b\u0435\u043a\u0442\u0440\u043e\u043d\u043d\u044b\u0435 \u0441\u0438\u0441\u0442\u0435\u043c\u044b \u0438 \u043a\u043e\u043c\u043f\u043b\u0435\u043a\u0441\u044b",
27
- "12": "\u041f\u0440\u0438\u0431\u043e\u0440\u043e\u0441\u0442\u0440\u043e\u0435\u043d\u0438\u0435. \u0418\u043d\u0442\u0435\u043b\u043b\u0435\u043a\u0442\u0443\u0430\u043b\u044c\u043d\u044b\u0435 \u0441\u0438\u0441\u0442\u0435\u043c\u044b",
28
- "13": "\u0411\u0438\u043e\u0442\u0435\u0445\u043d\u0438\u0447\u0435\u0441\u043a\u0438\u0435 \u0441\u0438\u0441\u0442\u0435\u043c\u044b \u0438 \u0442\u0435\u0445\u043d\u043e\u043b\u043e\u0433\u0438\u0438",
29
- "14": "\u042d\u043b\u0435\u043a\u0442\u0440\u043e\u044d\u043d\u0435\u0440\u0433\u0435\u0442\u0438\u043a\u0430 \u0438 \u044d\u043b\u0435\u043a\u0442\u0440\u043e\u0442\u0435\u0445\u043d\u0438\u043a\u0430",
30
- "15": "\u041c\u0435\u0445\u0430\u0442\u0440\u043e\u043d\u0438\u043a\u0430 \u0438 \u0440\u043e\u0431\u043e\u0442\u043e\u0442\u0435\u0445\u043d\u0438\u043a\u0430",
31
- "16": "\u0422\u0435\u0445\u043d\u043e\u0441\u0444\u0435\u0440\u043d\u0430\u044f \u0431\u0435\u0437\u043e\u043f\u0430\u0441\u043d\u043e\u0441\u0442\u044c",
32
- "17": "\u0421\u0438\u0441\u0442\u0435\u043c\u043d\u044b\u0439 \u0430\u043d\u0430\u043b\u0438\u0437 \u0438 \u0443\u043f\u0440\u0430\u0432\u043b\u0435\u043d\u0438\u0435",
33
- "18": "\u0423\u043f\u0440\u0430\u0432\u043b\u0435\u043d\u0438\u0435 \u0432 \u0442\u0435\u0445\u043d\u0438\u0447\u0435\u0441\u043a\u0438\u0445 \u0441\u0438\u0441\u0442\u0435\u043c\u0430\u0445. \u041a\u043e\u043c\u043f\u044c\u044e\u0442\u0435\u0440\u043d\u044b\u0435 \u0438\u043d\u0442\u0435\u043b\u043b\u0435\u043a\u0442\u0443\u0430\u043b\u044c\u043d\u044b\u0435 \u0442\u0435\u0445\u043d\u043e\u043b\u043e\u0433\u0438\u0438 \u0443\u043f\u0440\u0430\u0432\u043b\u0435\u043d\u0438\u044f \u0432 \u0442\u0435\u0445\u043d\u0438\u0447\u0435\u0441\u043a\u0438\u0445 \u0441\u0438\u0441\u0442\u0435\u043c\u0430\u0445",
34
- "19": "\u0423\u043f\u0440\u0430\u0432\u043b\u0435\u043d\u0438\u0435 \u0432 \u0442\u0435\u0445\u043d\u0438\u0447\u0435\u0441\u043a\u0438\u0445 \u0441\u0438\u0441\u0442\u0435\u043c\u0430\u0445. \u0410\u0432\u0442\u043e\u043c\u0430\u0442\u0438\u043a\u0430 \u0438 \u0440\u043e\u0431\u043e\u0442\u043e\u0442\u0435\u0445\u043d\u0438\u0447\u0435\u0441\u043a\u0438\u0435 \u0441\u0438\u0441\u0442\u0435\u043c\u044b",
35
- "20": "\u0418\u043d\u043d\u043e\u0432\u0430\u0442\u0438\u043a\u0430",
36
- "21": "\u041d\u0430\u043d\u043e\u0442\u0435\u0445\u043d\u043e\u043b\u043e\u0433\u0438\u0438 \u0438 \u043c\u0438\u043a\u0440\u043e\u0441\u0438\u0441\u0442\u0435\u043c\u043d\u0430\u044f \u0442\u0435\u0445\u043d\u0438\u043a\u0430",
37
- "22": "\u041c\u0435\u043d\u0435\u0434\u0436\u043c\u0435\u043d\u0442",
38
- "23": "\u0420\u0435\u043a\u043b\u0430\u043c\u0430 \u0438 \u0441\u0432\u044f\u0437\u0438 \u0441 \u043e\u0431\u0449\u0435\u0441\u0442\u0432\u0435\u043d\u043d\u043e\u0441\u0442\u044c\u044e",
39
- "24": "\u041b\u0438\u043d\u0433\u0432\u0438\u0441\u0442\u0438\u043a\u0430"
40
  },
41
  "initializer_range": 0.02,
42
- "intermediate_size": 4096,
43
  "label2id": {
44
- "\u0411\u0438\u043e\u0442\u0435\u0445\u043d\u0438\u0447\u0435\u0441\u043a\u0438\u0435 \u0441\u0438\u0441\u0442\u0435\u043c\u044b \u0438 \u0442\u0435\u0445\u043d\u043e\u043b\u043e\u0433\u0438\u0438": 13,
45
- "\u0418\u043d\u043d\u043e\u0432\u0430\u0442\u0438\u043a\u0430": 20,
46
- "\u0418\u043d\u0444\u043e\u043a\u043e\u043c\u043c\u0443\u043d\u0438\u043a\u0430\u0446\u0438\u043e\u043d\u043d\u044b\u0435 \u0442\u0435\u0445\u043d\u043e\u043b\u043e\u0433\u0438\u0438 \u0438 \u0441\u0438\u0441\u0442\u0435\u043c\u044b \u0441\u0432\u044f\u0437\u0438": 8,
47
- "\u0418\u043d\u0444\u043e\u0440\u043c\u0430\u0442\u0438\u043a\u0430 \u0438 \u0432\u044b\u0447\u0438\u0441\u043b\u0438\u0442\u0435\u043b\u044c\u043d\u0430\u044f \u0442\u0435\u0445\u043d\u0438\u043a\u0430. \u0418\u0441\u043a\u0443\u0441\u0441\u0442\u0432\u0435\u043d\u043d\u044b\u0439 \u0438\u043d\u0442\u0435\u043b\u043b\u0435\u043a\u0442": 1,
48
- "\u0418\u043d\u0444\u043e\u0440\u043c\u0430\u0442\u0438\u043a\u0430 \u0438 \u0432\u044b\u0447\u0438\u0441\u043b\u0438\u0442\u0435\u043b\u044c\u043d\u0430\u044f \u0442\u0435\u0445\u043d\u0438\u043a\u0430. \u041a\u043e\u043c\u043f\u044c\u044e\u0442\u0435\u0440\u043d\u043e\u0435 \u043c\u043e\u0434\u0435\u043b\u0438\u0440\u043e\u0432\u0430\u043d\u0438\u0435 \u0438 \u043f\u0440\u043e\u0435\u043a\u0442\u0438\u0440\u043e\u0432\u0430\u043d\u0438\u0435": 2,
49
- "\u0418\u043d\u0444\u043e\u0440\u043c\u0430\u0446\u0438\u043e\u043d\u043d\u044b\u0435 \u0441\u0438\u0441\u0442\u0435\u043c\u044b \u0438 \u0442\u0435\u0445\u043d\u043e\u043b\u043e\u0433\u0438\u0438": 3,
50
- "\u041a\u043e\u043c\u043f\u044c\u044e\u0442\u0435\u0440\u043d\u0430\u044f \u0431\u0435\u0437\u043e\u043f\u0430\u0441\u043d\u043e\u0441\u0442\u044c": 5,
51
- "\u041a\u043e\u043d\u0441\u0442\u0440\u0443\u0438\u0440\u043e\u0432\u0430\u043d\u0438\u0435 \u0438 \u0442\u0435\u0445\u043d\u043e\u043b\u043e\u0433\u0438\u044f \u044d\u043b\u0435\u043a\u0442\u0440\u043e\u043d\u043d\u044b\u0445 \u0441\u0440\u0435\u0434\u0441\u0442\u0432": 9,
52
- "\u041b\u0438\u043d\u0433\u0432\u0438\u0441\u0442\u0438\u043a\u0430": 24,
53
- "\u041c\u0435\u043d\u0435\u0434\u0436\u043c\u0435\u043d\u0442": 22,
54
- "\u041c\u0435\u0445\u0430\u0442\u0440\u043e\u043d\u0438\u043a\u0430 \u0438 \u0440\u043e\u0431\u043e\u0442\u043e\u0442\u0435\u0445\u043d\u0438\u043a\u0430": 15,
55
- "\u041d\u0430\u043d\u043e\u0442\u0435\u0445\u043d\u043e\u043b\u043e\u0433\u0438\u0438 \u0438 \u043c\u0438\u043a\u0440\u043e\u0441\u0438\u0441\u0442\u0435\u043c\u043d\u0430\u044f \u0442\u0435\u0445\u043d\u0438\u043a\u0430": 21,
56
- "\u041f\u0440\u0438\u0431\u043e\u0440\u043e\u0441\u0442\u0440\u043e\u0435\u043d\u0438\u0435. \u0418\u043d\u0442\u0435\u043b\u043b\u0435\u043a\u0442\u0443\u0430\u043b\u044c\u043d\u044b\u0435 \u0441\u0438\u0441\u0442\u0435\u043c\u044b": 12,
57
- "\u041f\u0440\u0438\u043a\u043b\u0430\u0434\u043d\u0430\u044f \u043c\u0430\u0442\u0435\u043c\u0430\u0442\u0438\u043a\u0430 \u0438 \u0438\u043d\u0444\u043e\u0440\u043c\u0430\u0442\u0438\u043a\u0430": 0,
58
- "\u041f\u0440\u043e\u0433\u0440\u0430\u043c\u043c\u043d\u0430\u044f \u0438\u043d\u0436\u0435\u043d\u0435\u0440\u0438\u044f": 4,
59
- "\u0420\u0430\u0434\u0438\u043e\u0442\u0435\u0445\u043d\u0438\u043a\u0430. \u0421\u0438\u0441\u0442\u0435\u043c\u044b \u043a\u043e\u043c\u043f\u044c\u044e\u0442\u0435\u0440\u043d\u043e\u0433\u043e \u0437\u0440\u0435\u043d\u0438\u044f": 6,
60
- "\u0420\u0430\u0434\u0438\u043e\u0442\u0435\u0445\u043d\u0438\u043a\u0430. \u0426\u0438\u0444\u0440\u043e\u0432\u044b\u0435 \u0441\u0438\u0441\u0442\u0435\u043c\u044b \u043b\u043e\u043a\u0430\u0446\u0438\u0438, \u0441\u0432\u044f\u0437\u0438 \u0438 \u043d\u0430\u0432\u0438\u0433\u0430\u0446\u0438\u0438": 7,
61
- "\u0420\u0430\u0434\u0438\u043e\u044d\u043b\u0435\u043a\u0442\u0440\u043e\u043d\u043d\u044b\u0435 \u0441\u0438\u0441\u0442\u0435\u043c\u044b \u0438 \u043a\u043e\u043c\u043f\u043b\u0435\u043a\u0441\u044b": 11,
62
- "\u0420\u0435\u043a\u043b\u0430\u043c\u0430 \u0438 \u0441\u0432\u044f\u0437\u0438 \u0441 \u043e\u0431\u0449\u0435\u0441\u0442\u0432\u0435\u043d\u043d\u043e\u0441\u0442\u044c\u044e": 23,
63
- "\u0421\u0438\u0441\u0442\u0435\u043c\u043d\u044b\u0439 \u0430\u043d\u0430\u043b\u0438\u0437 \u0438 \u0443\u043f\u0440\u0430\u0432\u043b\u0435\u043d\u0438\u0435": 17,
64
- "\u0422\u0435\u0445\u043d\u043e\u0441\u0444\u0435\u0440\u043d\u0430\u044f \u0431\u0435\u0437\u043e\u043f\u0430\u0441\u043d\u043e\u0441\u0442\u044c": 16,
65
- "\u0423\u043f\u0440\u0430\u0432\u043b\u0435\u043d\u0438\u0435 \u0432 \u0442\u0435\u0445\u043d\u0438\u0447\u0435\u0441\u043a\u0438\u0445 \u0441\u0438\u0441\u0442\u0435\u043c\u0430\u0445. \u0410\u0432\u0442\u043e\u043c\u0430\u0442\u0438\u043a\u0430 \u0438 \u0440\u043e\u0431\u043e\u0442\u043e\u0442\u0435\u0445\u043d\u0438\u0447\u0435\u0441\u043a\u0438\u0435 \u0441\u0438\u0441\u0442\u0435\u043c\u044b": 19,
66
- "\u0423\u043f\u0440\u0430\u0432\u043b\u0435\u043d\u0438\u0435 \u0432 \u0442\u0435\u0445\u043d\u0438\u0447\u0435\u0441\u043a\u0438\u0445 \u0441\u0438\u0441\u0442\u0435\u043c\u0430\u0445. \u041a\u043e\u043c\u043f\u044c\u044e\u0442\u0435\u0440\u043d\u044b\u0435 \u0438\u043d\u0442\u0435\u043b\u043b\u0435\u043a\u0442\u0443\u0430\u043b\u044c\u043d\u044b\u0435 \u0442\u0435\u0445\u043d\u043e\u043b\u043e\u0433\u0438\u0438 \u0443\u043f\u0440\u0430\u0432\u043b\u0435\u043d\u0438\u044f \u0432 \u0442\u0435\u0445\u043d\u0438\u0447\u0435\u0441\u043a\u0438\u0445 \u0441\u0438\u0441\u0442\u0435\u043c\u0430\u0445": 18,
67
- "\u042d\u043b\u0435\u043a\u0442\u0440\u043e\u043d\u0438\u043a\u0430 \u0438 \u043d\u0430\u043d\u043e\u044d\u043b\u0435\u043a\u0442\u0440\u043e\u043d\u0438\u043a\u0430": 10,
68
- "\u042d\u043b\u0435\u043a\u0442\u0440\u043e\u044d\u043d\u0435\u0440\u0433\u0435\u0442\u0438\u043a\u0430 \u0438 \u044d\u043b\u0435\u043a\u0442\u0440\u043e\u0442\u0435\u0445\u043d\u0438\u043a\u0430": 14
69
  },
70
  "layer_norm_eps": 1e-05,
71
  "max_position_embeddings": 514,
72
  "model_type": "roberta",
73
- "num_attention_heads": 16,
74
- "num_hidden_layers": 24,
 
75
  "pad_token_id": 1,
76
  "position_embedding_type": "absolute",
77
  "problem_type": "single_label_classification",
78
  "torch_dtype": "float32",
79
- "transformers_version": "4.38.2",
80
  "type_vocab_size": 1,
81
  "use_cache": true,
82
  "vocab_size": 50265
 
1
  {
2
+ "_name_or_path": "microsoft/codebert-base",
3
  "architectures": [
4
  "RobertaForSequenceClassification"
5
  ],
6
  "attention_probs_dropout_prob": 0.1,
7
+ "bos_token_id": 0,
8
  "classifier_dropout": null,
9
  "eos_token_id": 2,
 
10
  "hidden_act": "gelu",
11
  "hidden_dropout_prob": 0.1,
12
+ "hidden_size": 768,
13
  "id2label": {
14
+ "0": "Easy",
15
+ "1": "Medium",
16
+ "2": "Hard"
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
17
  },
18
  "initializer_range": 0.02,
19
+ "intermediate_size": 3072,
20
  "label2id": {
21
+ "Easy": 0,
22
+ "Hard": 2,
23
+ "Medium": 1
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
24
  },
25
  "layer_norm_eps": 1e-05,
26
  "max_position_embeddings": 514,
27
  "model_type": "roberta",
28
+ "num_attention_heads": 12,
29
+ "num_hidden_layers": 12,
30
+ "output_past": true,
31
  "pad_token_id": 1,
32
  "position_embedding_type": "absolute",
33
  "problem_type": "single_label_classification",
34
  "torch_dtype": "float32",
35
+ "transformers_version": "4.40.0",
36
  "type_vocab_size": 1,
37
  "use_cache": true,
38
  "vocab_size": 50265
merges.txt CHANGED
The diff for this file is too large to render. See raw diff
 
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:cd4de4d78bac6e8637b5c197d9572a29197c3ed492320bb9e5d16607e1d2cfb9
3
- size 1421589716
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:761675ea9e5c558deaee3d35bb114d20e99575da032ee55c457aa0a1cb84a459
3
+ size 498615900
runs/Apr25_11-02-50_1f13d83ecfdd/events.out.tfevents.1714042971.1f13d83ecfdd.9137.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:86a6007e096e7520fa29ee53f5c0610d93b7640928ef9ef949fc85b2582ca724
3
+ size 4648
runs/Apr25_11-04-32_1f13d83ecfdd/events.out.tfevents.1714043073.1f13d83ecfdd.9137.1 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:715202e0d4ff311cd9a668f29a3b3af6d0d7a3e5a707081a786eebc84c1ce7ce
3
+ size 4654
runs/Apr25_11-04-42_1f13d83ecfdd/events.out.tfevents.1714043082.1f13d83ecfdd.9137.2 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3bf01b7e16f23bf56da2df62b15561bfd8193e0af88feafbbfaee87f31c10a91
3
+ size 4648
runs/Apr25_11-04-49_1f13d83ecfdd/events.out.tfevents.1714043090.1f13d83ecfdd.9137.3 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:cf01b411c8db7fe808a3bb9d28f9ad70c8b6883715a114f872ba767a32829f80
3
+ size 4650
runs/Apr25_11-04-56_1f13d83ecfdd/events.out.tfevents.1714043097.1f13d83ecfdd.9137.4 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9336c6a534a6aafa4a0754ede8e41c4d63af2d168c5cc20116aa528b94d32f60
3
+ size 4648
runs/Apr25_11-05-22_1f13d83ecfdd/events.out.tfevents.1714043123.1f13d83ecfdd.9137.5 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3a2dba09d2d3a66ecb1f48f5ec661c27f9db4f179e18ba64c4b4201be3e8f83b
3
+ size 4650
runs/Apr25_11-31-05_1f13d83ecfdd/events.out.tfevents.1714044666.1f13d83ecfdd.9137.6 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1835e54c44bce57a46b939a4c4a0a3d1d965ee15e041eaf496b6d8191df8c6d3
3
+ size 4652
runs/Apr25_11-41-37_1f13d83ecfdd/events.out.tfevents.1714045298.1f13d83ecfdd.9137.7 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:898d1a6ce96ede5f8a57ded752391ecc7e253f40eaab5c8096b5ce4b66b7a285
3
+ size 4652
runs/Apr25_11-43-50_1f13d83ecfdd/events.out.tfevents.1714045430.1f13d83ecfdd.9137.8 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:dd9c548bd84426dc7a9a139c9cb2c06460c61523eb91aaf80503e338450e9048
3
+ size 4663
runs/Apr25_11-44-07_1f13d83ecfdd/events.out.tfevents.1714045448.1f13d83ecfdd.9137.9 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6e0580f3a3a1767a18bf03471c27434f60eea11637b1e9f7467d22aaf066156a
3
+ size 4663
runs/Apr25_11-50-56_1f13d83ecfdd/events.out.tfevents.1714045856.1f13d83ecfdd.9137.10 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:198a2b1655279ac6f5979262dff4ec1ffb77028e4b07a9683cb15b121584cb66
3
+ size 5014
runs/Apr25_12-08-46_1f13d83ecfdd/events.out.tfevents.1714046927.1f13d83ecfdd.9137.11 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:dd39f717f8f041c80ad23fa50271ae0515badb00125c2c5a792a9495d4b9f6ec
3
+ size 4852
runs/Apr25_12-09-14_1f13d83ecfdd/events.out.tfevents.1714046955.1f13d83ecfdd.9137.12 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:88307d4de2ba2a77b9f4cfa081cc5da909a821c495d6db93e020654ac076bd76
3
+ size 4849
runs/Apr25_12-09-37_1f13d83ecfdd/events.out.tfevents.1714046977.1f13d83ecfdd.9137.13 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:404a2e88cd6018cfe37459c2de0f6be5ac80a5cfe5900fde8e02ab9e6ee920cd
3
+ size 4849
runs/Apr25_12-10-39_1f13d83ecfdd/events.out.tfevents.1714047040.1f13d83ecfdd.9137.14 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:186cfe4203d7311ecc4950e3b4e4f76b6a3455e636911f1db4f8c84ec19d3ca0
3
+ size 4849
runs/Apr25_12-12-57_1f13d83ecfdd/events.out.tfevents.1714047177.1f13d83ecfdd.9137.15 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c4257fa0910f27b8a32651dbc1f2895acb284765c42536380f3379a3bb519af8
3
+ size 4849
runs/Apr25_12-14-17_1f13d83ecfdd/events.out.tfevents.1714047257.1f13d83ecfdd.9137.16 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:73b7b7ff45e68dd20867c075d64f49d4d1ee83ae7443136942b9b1087d3de88b
3
+ size 4849
runs/Apr25_12-15-59_1f13d83ecfdd/events.out.tfevents.1714047359.1f13d83ecfdd.9137.17 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:79ff9110492b655319698d45e9b47f1a5d6661bfb0ba59591c1c37eeb5d93d6c
3
+ size 4849
runs/Apr25_12-19-01_1f13d83ecfdd/events.out.tfevents.1714047541.1f13d83ecfdd.9137.18 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d0caf54cbd2ce45b7ff92d47a1b6bb1032b5f0b3010b2c5be4f93a69c42d30e9
3
+ size 4849
runs/Apr25_12-24-12_1f13d83ecfdd/events.out.tfevents.1714047852.1f13d83ecfdd.9137.19 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:eb9e830f42cd9d38c7dbce3197f3626888899c3891498c0e50747f95b7e13000
3
+ size 5787
runs/Apr25_12-25-30_1f13d83ecfdd/events.out.tfevents.1714047931.1f13d83ecfdd.9137.20 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e17b7aa650c7e553b790410fa514b98081bd226d839623707bce84987451c25e
3
+ size 5541
tokenizer.json CHANGED
The diff for this file is too large to render. See raw diff
 
tokenizer_config.json CHANGED
@@ -2,7 +2,7 @@
2
  "add_prefix_space": false,
3
  "added_tokens_decoder": {
4
  "0": {
5
- "content": "<pad>",
6
  "lstrip": false,
7
  "normalized": true,
8
  "rstrip": false,
@@ -10,7 +10,7 @@
10
  "special": true
11
  },
12
  "1": {
13
- "content": "<s>",
14
  "lstrip": false,
15
  "normalized": true,
16
  "rstrip": false,
@@ -33,7 +33,7 @@
33
  "single_word": false,
34
  "special": true
35
  },
36
- "4": {
37
  "content": "<mask>",
38
  "lstrip": true,
39
  "normalized": false,
@@ -48,7 +48,7 @@
48
  "eos_token": "</s>",
49
  "errors": "replace",
50
  "mask_token": "<mask>",
51
- "model_max_length": 1000000000000000019884624838656,
52
  "pad_token": "<pad>",
53
  "sep_token": "</s>",
54
  "tokenizer_class": "RobertaTokenizer",
 
2
  "add_prefix_space": false,
3
  "added_tokens_decoder": {
4
  "0": {
5
+ "content": "<s>",
6
  "lstrip": false,
7
  "normalized": true,
8
  "rstrip": false,
 
10
  "special": true
11
  },
12
  "1": {
13
+ "content": "<pad>",
14
  "lstrip": false,
15
  "normalized": true,
16
  "rstrip": false,
 
33
  "single_word": false,
34
  "special": true
35
  },
36
+ "50264": {
37
  "content": "<mask>",
38
  "lstrip": true,
39
  "normalized": false,
 
48
  "eos_token": "</s>",
49
  "errors": "replace",
50
  "mask_token": "<mask>",
51
+ "model_max_length": 512,
52
  "pad_token": "<pad>",
53
  "sep_token": "</s>",
54
  "tokenizer_class": "RobertaTokenizer",
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:b7a065c91798730e277d4323e5669d94466d06a306538c4f14aa077bd5b733c1
3
- size 4856
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4576c6e865530410771dfbb6d8bdf2094ab5a40071cf237bec8909f487296f37
3
+ size 4984
vocab.json CHANGED
The diff for this file is too large to render. See raw diff