idolezal committed on
Commit
37d296d
·
1 Parent(s): a658d09

Added specified metric for every task in "tasks_metadata.json"

Browse files
Files changed (1) hide show
  1. tasks_metadata.json +108 -54
tasks_metadata.json CHANGED
@@ -4,377 +4,431 @@
4
  "source_url": "https://huggingface.co/datasets/CZLC/propaganda_argumentace",
5
  "short_name": "P-Argumentace",
6
  "category": "NLI",
7
- "abbreviation": "P-ARG"
 
8
  },
9
  "benczechmark_propaganda_fabulace": {
10
  "name": "Propaganda – Fabulace",
11
  "source_url": "https://huggingface.co/datasets/CZLC/propaganda_fabulace",
12
  "short_name": "P-Fabulace",
13
  "category": "NLI",
14
- "abbreviation": "P-FAB"
 
15
  },
16
  "benczechmark_propaganda_nazor": {
17
  "name": "Propaganda – NΓ‘zor",
18
  "source_url": "https://huggingface.co/datasets/CZLC/propaganda_nazor",
19
  "short_name": "P-NΓ‘zor",
20
  "category": "NLI",
21
- "abbreviation": "P-NAZOR"
 
22
  },
23
  "benczechmark_propaganda_strach": {
24
  "name": "Propaganda – Strach",
25
  "source_url": "https://huggingface.co/datasets/CZLC/propaganda_strach",
26
  "short_name": "P-Strach",
27
  "category": "NLI",
28
- "abbreviation": "P-STCH"
 
29
  },
30
  "benczechmark_propaganda_zamereni": {
31
  "name": "Propaganda – ZamΔ›Ε™enΓ­",
32
  "source_url": "https://huggingface.co/datasets/CZLC/propaganda_zamereni",
33
  "short_name": "P-ZamΔ›Ε™enΓ­",
34
  "category": "NLI",
35
- "abbreviation": "P-MER"
 
36
  },
37
  "benczechmark_propaganda_demonizace": {
38
  "name": "Propaganda – DΓ©monizace",
39
  "source_url": "https://huggingface.co/datasets/CZLC/propaganda_demonizace",
40
  "short_name": "P-DΓ©monizace",
41
  "category": "NLI",
42
- "abbreviation": "P-DEMON"
 
43
  },
44
  "benczechmark_propaganda_lokace": {
45
  "name": "Propaganda – Lokace",
46
  "source_url": "https://huggingface.co/datasets/CZLC/propaganda_lokace",
47
  "short_name": "P-Lokace",
48
  "category": "NLI",
49
- "abbreviation": "P-LOK"
 
50
  },
51
  "benczechmark_propaganda_relativizace": {
52
  "name": "Propaganda – Relativizace",
53
  "source_url": "https://huggingface.co/datasets/CZLC/propaganda_relativizace",
54
  "short_name": "P-Relativizace",
55
  "category": "NLI",
56
- "abbreviation": "P-REL"
 
57
  },
58
  "benczechmark_propaganda_vina": {
59
  "name": "Propaganda – Vina",
60
  "source_url": "https://huggingface.co/datasets/CZLC/propaganda_vina",
61
  "short_name": "P-Vina",
62
  "category": "NLI",
63
- "abbreviation": "P-VINA"
 
64
  },
65
  "benczechmark_propaganda_zanr": {
66
  "name": "Propaganda – Ε½Γ‘nr",
67
  "source_url": "https://huggingface.co/datasets/CZLC/propaganda_zanr",
68
  "short_name": "P-Ε½Γ‘nr",
69
  "category": "NLI",
70
- "abbreviation": "P-ZANR"
 
71
  },
72
  "benczechmark_propaganda_emoce": {
73
  "name": "Propaganda – Emoce",
74
  "source_url": "https://huggingface.co/datasets/CZLC/propaganda_emoce",
75
  "short_name": "P-Emoce",
76
  "category": "NLI",
77
- "abbreviation": "P-EMOCE"
 
78
  },
79
  "benczechmark_propaganda_nalepkovani": {
80
  "name": "Propaganda – NΓ‘lepkovΓ‘nΓ­",
81
  "source_url": "https://huggingface.co/datasets/CZLC/propaganda_nalepkovani",
82
  "short_name": "P-NΓ‘lepkovΓ‘nΓ­",
83
  "category": "NLI",
84
- "abbreviation": "P-LEP"
 
85
  },
86
  "benczechmark_propaganda_rusko": {
87
  "name": "Propaganda – Rusko",
88
  "source_url": "https://huggingface.co/datasets/CZLC/propaganda_rusko",
89
  "short_name": "P-Rusko",
90
  "category": "NLI",
91
- "abbreviation": "P-RUS"
 
92
  },
93
  "benczechmark_sentiment_mall": {
94
  "name": "CzechSentiment MALL",
95
  "source_url": "https://huggingface.co/datasets/CZLC/mall_sentiment_balanced",
96
  "short_name": "S-Mall",
97
  "category": "Sentiment",
98
- "abbreviation": "S-MALL"
 
99
  },
100
  "benczechmark_sentiment_fb": {
101
  "name": "CzechSentiment FB",
102
  "source_url": "https://huggingface.co/datasets/CZLC/fb_sentiment_balanced",
103
  "short_name": "S-FB",
104
  "category": "Sentiment",
105
- "abbreviation": "S-FB"
 
106
  },
107
  "benczechmark_sentiment_csfd": {
108
  "name": "CzechSentiment CSFD",
109
  "source_url": "https://huggingface.co/datasets/CZLC/csfd_sentiment_balanced",
110
  "short_name": "S-CSFD",
111
  "category": "Sentiment",
112
- "abbreviation": "S-CSFD"
 
113
  },
114
  "benczechmark_summarization": {
115
  "name": "SUMECZECH",
116
  "source_url": "https://huggingface.co/datasets/CZLC/sumeczech_downsampled",
117
  "short_name": "Summarization",
118
  "category": "Summarization",
119
- "abbreviation": "SUM"
 
120
  },
121
  "benczechmark_grammarerrorcorrection": {
122
  "name": "GrammarErrorCorrection",
123
  "source_url": "https://huggingface.co/datasets/CZLC/cs_gec",
124
  "short_name": "Grammar Error Correction",
125
  "category": "Syntactical Reasoning",
126
- "abbreviation": "GEC"
 
127
  },
128
  "benczechmark_cs_naturalquestions": {
129
  "name": "NaturalQuestions-CZ",
130
  "source_url": "https://huggingface.co/datasets/CZLC/cs_naturalquestions",
131
  "short_name": "CS Natural Questions",
132
  "category": "Knowledge",
133
- "abbreviation": "NQ"
 
134
  },
135
  "benczechmark_cs_sqad32": {
136
  "name": "SQAD3.2",
137
  "source_url": "https://huggingface.co/datasets/CZLC/SQAD_3.2",
138
  "short_name": "CS SQAD 3.2",
139
  "category": "Knowledge",
140
- "abbreviation": "SQAD32"
 
141
  },
142
  "benczechmark_cs_triviaQA": {
143
  "name": "TriviaQA-CZ",
144
  "source_url": "https://huggingface.co/datasets/CZLC/cs_triviaqa",
145
  "short_name": "CS TriviaQA",
146
  "category": "Knowledge",
147
- "abbreviation": "TQA"
 
148
  },
149
  "benczechmark_csfever_nli": {
150
  "name": "CSFEVER",
151
  "source_url": "https://huggingface.co/datasets/CZLC/ctu-aic/csfever_nli",
152
  "short_name": "CSFever NLI",
153
  "category": "NLI",
154
- "abbreviation": "CFR"
 
155
  },
156
  "benczechmark_ctkfacts_nli": {
157
  "name": "CTKFACTS",
158
  "source_url": "https://huggingface.co/datasets/CZLC/ctu-aic/ctkfacts_nli",
159
  "short_name": "CTKFacts NLI",
160
  "category": "NLI",
161
- "abbreviation": "CTK"
 
162
  },
163
  "benczechmark_cs_ner": {
164
  "name": "Czech Named Entity Corpus 2.0\n",
165
  "source_url": "https://huggingface.co/datasets/CZLC/cnec_2.0",
166
  "short_name": "CNEC2.0",
167
  "category": "NER",
168
- "abbreviation": "CNEC"
 
169
  },
170
  "benczechmark_hellaswag": {
171
  "name": "HellaSwag-CZ",
172
  "source_url": "https://huggingface.co/datasets/CZLC/cs_hellaswag",
173
  "short_name": "HellaSwag",
174
  "category": "Language Modeling",
175
- "abbreviation": "HASG"
 
176
  },
177
  "benczechmark_histcorpus": {
178
  "name": "Historical Corpus",
179
  "source_url": "https://huggingface.co/datasets/CZLC/benczechmark_histcorpus",
180
  "short_name": "HistCorpus",
181
  "category": "Language Modeling",
182
- "abbreviation": "HIST"
 
183
  },
184
  "benczechmark_klokan_qa": {
185
  "name": "Klokan QA",
186
  "source_url": "https://huggingface.co/datasets/hynky/klokan-qa",
187
  "short_name": "Klokan QA",
188
  "category": "Czech Math Reasoning",
189
- "abbreviation": "KQA"
 
190
  },
191
  "benczechmark_cs_court_decisions_ner": {
192
  "name": "Czech Court Decisions",
193
  "source_url": "https://huggingface.co/datasets/CZLC/ner_court_decisions",
194
  "short_name": "CS Court Decisions NER",
195
  "category": "NER",
196
- "abbreviation": "CCDNER"
 
197
  },
198
  "benczechmark_umimeto_biology": {
199
  "name": "Umimeto.cz – Biology",
200
  "source_url": "https://huggingface.co/datasets/CZLC/umimeto-qa/viewer/biology",
201
  "short_name": "Umimeto.cz – Biology",
202
  "category": "General Reasoning",
203
- "abbreviation": "UT-BIO"
 
204
  },
205
  "benczechmark_umimeto_chemistry": {
206
  "name": "Umimeto.cz – Chemistry",
207
  "source_url": "https://huggingface.co/datasets/CZLC/umimeto-qa/viewer/chemistry",
208
  "short_name": "Umimeto.cz – Chemistry",
209
  "category": "General Reasoning",
210
- "abbreviation": "UT-CHEM"
 
211
  },
212
  "benczechmark_umimeto_czech": {
213
  "name": "Umimeto.cz – Czech Language",
214
  "source_url": "https://huggingface.co/datasets/CZLC/umimeto-qa/viewer/czech",
215
  "short_name": "Umimeto.cz – Czech",
216
  "category": "General Reasoning",
217
- "abbreviation": "UT-CZEL"
 
218
  },
219
  "benczechmark_umimeto_history": {
220
  "name": "Umimeto.cz – History",
221
  "source_url": "https://huggingface.co/datasets/CZLC/umimeto-qa/viewer/history",
222
  "short_name": "Umimeto.cz – History",
223
  "category": "General Reasoning",
224
- "abbreviation": "UT-HIST"
 
225
  },
226
  "benczechmark_umimeto_informatics": {
227
  "name": "Umimeto.cz – Informatics",
228
  "source_url": "https://huggingface.co/datasets/CZLC/umimeto-qa/viewer/informatics",
229
  "short_name": "Umimeto.cz – Informatics",
230
  "category": "General Reasoning",
231
- "abbreviation": "UT-IT"
 
232
  },
233
  "benczechmark_umimeto_math": {
234
  "name": "Umimeto.cz οΏ½οΏ½οΏ½ Math",
235
  "source_url": "https://huggingface.co/datasets/CZLC/umimeto-qa/viewer/math",
236
  "short_name": "Umimeto.cz – Math",
237
  "category": "Czech Math Reasoning",
238
- "abbreviation": "UT-MATH"
 
239
  },
240
  "benczechmark_umimeto_physics": {
241
  "name": "Umimeto.cz – Physics",
242
  "source_url": "https://huggingface.co/datasets/CZLC/umimeto-qa/viewer/physics",
243
  "short_name": "Umimeto.cz – Physics",
244
  "category": "General Reasoning",
245
- "abbreviation": "UT-PHYS"
 
246
  },
247
  "benczechmark_cermat_czmath_mc": {
248
  "name": "CERMAT – Czech Math – MC",
249
  "source_url": "https://huggingface.co/datasets/CZLC/cermat_math_mc",
250
  "short_name": "Cermat Czech Math MC",
251
  "category": "Czech Math Reasoning",
252
- "abbreviation": "CCM-MC"
 
253
  },
254
  "benczechmark_cermat_czmath_open": {
255
  "name": "CERMAT – Czech Math – OPEN",
256
  "source_url": "https://huggingface.co/datasets/CZLC/cermat_math_open",
257
  "short_name": "Cermat Czech Math Open",
258
  "category": "Czech Math Reasoning",
259
- "abbreviation": "CCM-OPEN"
 
260
  },
261
  "benczechmark_cermat_czech_tf": {
262
  "name": "CERMAT – Czech Language – TF",
263
  "source_url": "https://huggingface.co/datasets/CZLC/cermat_czech_tf",
264
  "short_name": "Cermat Czech Language TF",
265
  "category": "General Reasoning",
266
- "abbreviation": "CCL-TF"
 
267
  },
268
  "benczechmark_cermat_czech_mc": {
269
  "name": "CERMAT – Czech Language – MC",
270
  "source_url": "https://huggingface.co/datasets/CZLC/cermat_czech_mc",
271
  "short_name": "Cermat Czech Language MC",
272
  "category": "General Reasoning",
273
- "abbreviation": "CCL-MC"
 
274
  },
275
  "benczechmark_cermat_czech_open": {
276
  "name": "CERMAT – Czech Language – OPEN",
277
  "source_url": "https://huggingface.co/datasets/CZLC/cermat_czech_open",
278
  "short_name": "Cermat Czech Language Open",
279
  "category": "General Reasoning",
280
- "abbreviation": "CCL-OPEN"
 
281
  },
282
  "benczechmark_history_ir": {
283
  "name": "Historical Relevance Grading",
284
  "source_url": "https://huggingface.co/datasets/CZLC/history_retrieval",
285
  "abbreviation": "HIST-IR",
286
  "category": "Historical",
287
- "short_name": "Czech History IR"
 
288
  },
289
  "benczechmark_agree": {
290
  "name": "Agree",
291
  "source_url": "https://huggingface.co/datasets/davidadamczyk/czechbench_agree",
292
  "abbreviation": "Agree",
293
  "category": "Syntactical Reasoning",
294
- "short_name": "Agree"
 
295
  },
296
  "benczechmark_belebele": {
297
  "name": "Belebele",
298
  "source_url": "https://huggingface.co/datasets/davidadamczyk/czechbench_belebele",
299
  "abbreviation": "BB",
300
  "category": "Knowledge",
301
- "short_name": "Belebele"
 
302
  },
303
  "benczechmark_czechnews": {
304
  "name": "CZ-NEWS",
305
  "source_url": "https://huggingface.co/datasets/davidadamczyk/czechbench_czech_news",
306
  "abbreviation": "CZ-NEWS",
307
  "category": "Topic Classification",
308
- "short_name": "Czech News"
 
309
  },
310
  "benczechmark_subjectivity": {
311
  "name": "Subjectivity",
312
  "source_url": "https://huggingface.co/datasets/davidadamczyk/czechbench_subjectivity",
313
  "abbreviation": "SUBJ",
314
  "category": "Sentiment",
315
- "short_name": "Subjectivity"
 
316
  },
317
  "benczechmark_essay": {
318
  "name": "Czech National Corpus – Essays",
319
  "source_url": "https://huggingface.co/datasets/CZLC/CNC_skript12",
320
  "abbreviation": "CNC-E",
321
  "category": "Language Modeling",
322
- "short_name": "CNC – Essays"
 
323
  },
324
  "benczechmark_fiction": {
325
  "name": "Czech National Corpus – Fiction",
326
  "source_url": "https://huggingface.co/datasets/CZLC/CNC_fictree",
327
  "abbreviation": "CNC-F",
328
  "category": "Language Modeling",
329
- "short_name": "CNC – Fiction"
 
330
  },
331
  "benczechmark_capek": {
332
  "name": "Czech National Corpus – Karel Čapek",
333
  "source_url": "https://huggingface.co/datasets/CZLC/CNC_Capek",
334
  "abbreviation": "CNC-CAP",
335
  "category": "Language Modeling",
336
- "short_name": "CNC – Čapek"
 
337
  },
338
  "benczechmark_correspondence": {
339
  "name": "Czech National Corpus – Correspondence",
340
  "source_url": "https://huggingface.co/datasets/CZLC/CNC_KSK",
341
  "abbreviation": "CNC-KSK",
342
  "category": "Language Modeling",
343
- "short_name": "CNC – Correspondence"
 
344
  },
345
  "benczechmark_havlicek": {
346
  "name": "Czech National Corpus – Karel Havlíček – Noviny",
347
  "source_url": "https://huggingface.co/datasets/CZLC/CNC_KHavlicek_HistNews",
348
  "abbreviation": "CNC-KH",
349
  "category": "Language Modeling",
350
- "short_name": "CNC – KHavlicek – HistNews"
 
351
  },
352
  "benczechmark_speeches": {
353
  "name": "Czech National Corpus – Speeches",
354
  "source_url": "https://huggingface.co/datasets/CZLC/CNC_PrezPrejavy",
355
  "abbreviation": "CNC-SPCH",
356
  "category": "Language Modeling",
357
- "short_name": "CNC – Speeches"
 
358
  },
359
  "benczechmark_spoken": {
360
  "name": "Czech National Corpus – Spoken",
361
  "source_url": "https://huggingface.co/datasets/CZLC/CNC_oral_ortofon",
362
  "abbreviation": "CNC-SPK",
363
  "category": "Language Modeling",
364
- "short_name": "CNC – Spoken"
 
365
  },
366
  "benczechmark_dialect": {
367
  "name": "Czech National Corpus – Dialect",
368
  "source_url": "https://huggingface.co/datasets/CZLC/CNC_Dialekt",
369
  "abbreviation": "CNC-DIAL",
370
  "category": "Language Modeling",
371
- "short_name": "CNC – DIALEKT"
 
372
  },
373
  "benczechmark_snli": {
374
  "name": "Czech SNLI",
375
  "source_url": "https://huggingface.co/datasets/CZLC/snli",
376
  "abbreviation": "SNLI",
377
  "category": "NLI",
378
- "short_name": "Czech SNLI"
 
379
  }
380
  }
 
4
  "source_url": "https://huggingface.co/datasets/CZLC/propaganda_argumentace",
5
  "short_name": "P-Argumentace",
6
  "category": "NLI",
7
+ "abbreviation": "P-ARG",
8
+ "metric": "avg_mcauroc"
9
  },
10
  "benczechmark_propaganda_fabulace": {
11
  "name": "Propaganda – Fabulace",
12
  "source_url": "https://huggingface.co/datasets/CZLC/propaganda_fabulace",
13
  "short_name": "P-Fabulace",
14
  "category": "NLI",
15
+ "abbreviation": "P-FAB",
16
+ "metric": "avg_mcauroc"
17
  },
18
  "benczechmark_propaganda_nazor": {
19
  "name": "Propaganda – NΓ‘zor",
20
  "source_url": "https://huggingface.co/datasets/CZLC/propaganda_nazor",
21
  "short_name": "P-NΓ‘zor",
22
  "category": "NLI",
23
+ "abbreviation": "P-NAZOR",
24
+ "metric": "avg_mcauroc"
25
  },
26
  "benczechmark_propaganda_strach": {
27
  "name": "Propaganda – Strach",
28
  "source_url": "https://huggingface.co/datasets/CZLC/propaganda_strach",
29
  "short_name": "P-Strach",
30
  "category": "NLI",
31
+ "abbreviation": "P-STCH",
32
+ "metric": "avg_mcauroc"
33
  },
34
  "benczechmark_propaganda_zamereni": {
35
  "name": "Propaganda – ZamΔ›Ε™enΓ­",
36
  "source_url": "https://huggingface.co/datasets/CZLC/propaganda_zamereni",
37
  "short_name": "P-ZamΔ›Ε™enΓ­",
38
  "category": "NLI",
39
+ "abbreviation": "P-MER",
40
+ "metric": "avg_mcauroc"
41
  },
42
  "benczechmark_propaganda_demonizace": {
43
  "name": "Propaganda – DΓ©monizace",
44
  "source_url": "https://huggingface.co/datasets/CZLC/propaganda_demonizace",
45
  "short_name": "P-DΓ©monizace",
46
  "category": "NLI",
47
+ "abbreviation": "P-DEMON",
48
+ "metric": "avg_mcauroc"
49
  },
50
  "benczechmark_propaganda_lokace": {
51
  "name": "Propaganda – Lokace",
52
  "source_url": "https://huggingface.co/datasets/CZLC/propaganda_lokace",
53
  "short_name": "P-Lokace",
54
  "category": "NLI",
55
+ "abbreviation": "P-LOK",
56
+ "metric": "avg_mcauroc"
57
  },
58
  "benczechmark_propaganda_relativizace": {
59
  "name": "Propaganda – Relativizace",
60
  "source_url": "https://huggingface.co/datasets/CZLC/propaganda_relativizace",
61
  "short_name": "P-Relativizace",
62
  "category": "NLI",
63
+ "abbreviation": "P-REL",
64
+ "metric": "avg_mcauroc"
65
  },
66
  "benczechmark_propaganda_vina": {
67
  "name": "Propaganda – Vina",
68
  "source_url": "https://huggingface.co/datasets/CZLC/propaganda_vina",
69
  "short_name": "P-Vina",
70
  "category": "NLI",
71
+ "abbreviation": "P-VINA",
72
+ "metric": "avg_mcauroc"
73
  },
74
  "benczechmark_propaganda_zanr": {
75
  "name": "Propaganda – Ε½Γ‘nr",
76
  "source_url": "https://huggingface.co/datasets/CZLC/propaganda_zanr",
77
  "short_name": "P-Ε½Γ‘nr",
78
  "category": "NLI",
79
+ "abbreviation": "P-ZANR",
80
+ "metric": "avg_mcauroc"
81
  },
82
  "benczechmark_propaganda_emoce": {
83
  "name": "Propaganda – Emoce",
84
  "source_url": "https://huggingface.co/datasets/CZLC/propaganda_emoce",
85
  "short_name": "P-Emoce",
86
  "category": "NLI",
87
+ "abbreviation": "P-EMOCE",
88
+ "metric": "avg_mcauroc"
89
  },
90
  "benczechmark_propaganda_nalepkovani": {
91
  "name": "Propaganda – NΓ‘lepkovΓ‘nΓ­",
92
  "source_url": "https://huggingface.co/datasets/CZLC/propaganda_nalepkovani",
93
  "short_name": "P-NΓ‘lepkovΓ‘nΓ­",
94
  "category": "NLI",
95
+ "abbreviation": "P-LEP",
96
+ "metric": "avg_mcauroc"
97
  },
98
  "benczechmark_propaganda_rusko": {
99
  "name": "Propaganda – Rusko",
100
  "source_url": "https://huggingface.co/datasets/CZLC/propaganda_rusko",
101
  "short_name": "P-Rusko",
102
  "category": "NLI",
103
+ "abbreviation": "P-RUS",
104
+ "metric": "avg_mcauroc"
105
  },
106
  "benczechmark_sentiment_mall": {
107
  "name": "CzechSentiment MALL",
108
  "source_url": "https://huggingface.co/datasets/CZLC/mall_sentiment_balanced",
109
  "short_name": "S-Mall",
110
  "category": "Sentiment",
111
+ "abbreviation": "S-MALL",
112
+ "metric": "avg_mcauroc"
113
  },
114
  "benczechmark_sentiment_fb": {
115
  "name": "CzechSentiment FB",
116
  "source_url": "https://huggingface.co/datasets/CZLC/fb_sentiment_balanced",
117
  "short_name": "S-FB",
118
  "category": "Sentiment",
119
+ "abbreviation": "S-FB",
120
+ "metric": "avg_mcauroc"
121
  },
122
  "benczechmark_sentiment_csfd": {
123
  "name": "CzechSentiment CSFD",
124
  "source_url": "https://huggingface.co/datasets/CZLC/csfd_sentiment_balanced",
125
  "short_name": "S-CSFD",
126
  "category": "Sentiment",
127
+ "abbreviation": "S-CSFD",
128
+ "metric": "avg_mcauroc"
129
  },
130
  "benczechmark_summarization": {
131
  "name": "SUMECZECH",
132
  "source_url": "https://huggingface.co/datasets/CZLC/sumeczech_downsampled",
133
  "short_name": "Summarization",
134
  "category": "Summarization",
135
+ "abbreviation": "SUM",
136
+ "metric": "rouge_raw_r2_mid_f"
137
  },
138
  "benczechmark_grammarerrorcorrection": {
139
  "name": "GrammarErrorCorrection",
140
  "source_url": "https://huggingface.co/datasets/CZLC/cs_gec",
141
  "short_name": "Grammar Error Correction",
142
  "category": "Syntactical Reasoning",
143
+ "abbreviation": "GEC",
144
+ "metric": "avg_mcauroc"
145
  },
146
  "benczechmark_cs_naturalquestions": {
147
  "name": "NaturalQuestions-CZ",
148
  "source_url": "https://huggingface.co/datasets/CZLC/cs_naturalquestions",
149
  "short_name": "CS Natural Questions",
150
  "category": "Knowledge",
151
+ "abbreviation": "NQ",
152
+ "metric": "exact_match"
153
  },
154
  "benczechmark_cs_sqad32": {
155
  "name": "SQAD3.2",
156
  "source_url": "https://huggingface.co/datasets/CZLC/SQAD_3.2",
157
  "short_name": "CS SQAD 3.2",
158
  "category": "Knowledge",
159
+ "abbreviation": "SQAD32",
160
+ "metric": "exact_match"
161
  },
162
  "benczechmark_cs_triviaQA": {
163
  "name": "TriviaQA-CZ",
164
  "source_url": "https://huggingface.co/datasets/CZLC/cs_triviaqa",
165
  "short_name": "CS TriviaQA",
166
  "category": "Knowledge",
167
+ "abbreviation": "TQA",
168
+ "metric": "exact_match"
169
  },
170
  "benczechmark_csfever_nli": {
171
  "name": "CSFEVER",
172
  "source_url": "https://huggingface.co/datasets/CZLC/ctu-aic/csfever_nli",
173
  "short_name": "CSFever NLI",
174
  "category": "NLI",
175
+ "abbreviation": "CFR",
176
+ "metric": "avg_mcauroc"
177
  },
178
  "benczechmark_ctkfacts_nli": {
179
  "name": "CTKFACTS",
180
  "source_url": "https://huggingface.co/datasets/CZLC/ctu-aic/ctkfacts_nli",
181
  "short_name": "CTKFacts NLI",
182
  "category": "NLI",
183
+ "abbreviation": "CTK",
184
+ "metric": "avg_mcauroc"
185
  },
186
  "benczechmark_cs_ner": {
187
  "name": "Czech Named Entity Corpus 2.0\n",
188
  "source_url": "https://huggingface.co/datasets/CZLC/cnec_2.0",
189
  "short_name": "CNEC2.0",
190
  "category": "NER",
191
+ "abbreviation": "CNEC",
192
+ "metric": "exact_match"
193
  },
194
  "benczechmark_hellaswag": {
195
  "name": "HellaSwag-CZ",
196
  "source_url": "https://huggingface.co/datasets/CZLC/cs_hellaswag",
197
  "short_name": "HellaSwag",
198
  "category": "Language Modeling",
199
+ "abbreviation": "HASG",
200
+ "metric": "acc"
201
  },
202
  "benczechmark_histcorpus": {
203
  "name": "Historical Corpus",
204
  "source_url": "https://huggingface.co/datasets/CZLC/benczechmark_histcorpus",
205
  "short_name": "HistCorpus",
206
  "category": "Language Modeling",
207
+ "abbreviation": "HIST",
208
+ "metric": "word_perplexity"
209
  },
210
  "benczechmark_klokan_qa": {
211
  "name": "Klokan QA",
212
  "source_url": "https://huggingface.co/datasets/hynky/klokan-qa",
213
  "short_name": "Klokan QA",
214
  "category": "Czech Math Reasoning",
215
+ "abbreviation": "KQA",
216
+ "metric": "acc"
217
  },
218
  "benczechmark_cs_court_decisions_ner": {
219
  "name": "Czech Court Decisions",
220
  "source_url": "https://huggingface.co/datasets/CZLC/ner_court_decisions",
221
  "short_name": "CS Court Decisions NER",
222
  "category": "NER",
223
+ "abbreviation": "CCDNER",
224
+ "metric": "exact_match"
225
  },
226
  "benczechmark_umimeto_biology": {
227
  "name": "Umimeto.cz – Biology",
228
  "source_url": "https://huggingface.co/datasets/CZLC/umimeto-qa/viewer/biology",
229
  "short_name": "Umimeto.cz – Biology",
230
  "category": "General Reasoning",
231
+ "abbreviation": "UT-BIO",
232
+ "metric": "acc"
233
  },
234
  "benczechmark_umimeto_chemistry": {
235
  "name": "Umimeto.cz – Chemistry",
236
  "source_url": "https://huggingface.co/datasets/CZLC/umimeto-qa/viewer/chemistry",
237
  "short_name": "Umimeto.cz – Chemistry",
238
  "category": "General Reasoning",
239
+ "abbreviation": "UT-CHEM",
240
+ "metric": "acc"
241
  },
242
  "benczechmark_umimeto_czech": {
243
  "name": "Umimeto.cz – Czech Language",
244
  "source_url": "https://huggingface.co/datasets/CZLC/umimeto-qa/viewer/czech",
245
  "short_name": "Umimeto.cz – Czech",
246
  "category": "General Reasoning",
247
+ "abbreviation": "UT-CZEL",
248
+ "metric": "acc"
249
  },
250
  "benczechmark_umimeto_history": {
251
  "name": "Umimeto.cz – History",
252
  "source_url": "https://huggingface.co/datasets/CZLC/umimeto-qa/viewer/history",
253
  "short_name": "Umimeto.cz – History",
254
  "category": "General Reasoning",
255
+ "abbreviation": "UT-HIST",
256
+ "metric": "acc"
257
  },
258
  "benczechmark_umimeto_informatics": {
259
  "name": "Umimeto.cz – Informatics",
260
  "source_url": "https://huggingface.co/datasets/CZLC/umimeto-qa/viewer/informatics",
261
  "short_name": "Umimeto.cz – Informatics",
262
  "category": "General Reasoning",
263
+ "abbreviation": "UT-IT",
264
+ "metric": "acc"
265
  },
266
  "benczechmark_umimeto_math": {
267
  "name": "Umimeto.cz οΏ½οΏ½οΏ½ Math",
268
  "source_url": "https://huggingface.co/datasets/CZLC/umimeto-qa/viewer/math",
269
  "short_name": "Umimeto.cz – Math",
270
  "category": "Czech Math Reasoning",
271
+ "abbreviation": "UT-MATH",
272
+ "metric": "acc"
273
  },
274
  "benczechmark_umimeto_physics": {
275
  "name": "Umimeto.cz – Physics",
276
  "source_url": "https://huggingface.co/datasets/CZLC/umimeto-qa/viewer/physics",
277
  "short_name": "Umimeto.cz – Physics",
278
  "category": "General Reasoning",
279
+ "abbreviation": "UT-PHYS",
280
+ "metric": "acc"
281
  },
282
  "benczechmark_cermat_czmath_mc": {
283
  "name": "CERMAT – Czech Math – MC",
284
  "source_url": "https://huggingface.co/datasets/CZLC/cermat_math_mc",
285
  "short_name": "Cermat Czech Math MC",
286
  "category": "Czech Math Reasoning",
287
+ "abbreviation": "CCM-MC",
288
+ "metric": "acc"
289
  },
290
  "benczechmark_cermat_czmath_open": {
291
  "name": "CERMAT – Czech Math – OPEN",
292
  "source_url": "https://huggingface.co/datasets/CZLC/cermat_math_open",
293
  "short_name": "Cermat Czech Math Open",
294
  "category": "Czech Math Reasoning",
295
+ "abbreviation": "CCM-OPEN",
296
+ "metric": "exact_match"
297
  },
298
  "benczechmark_cermat_czech_tf": {
299
  "name": "CERMAT – Czech Language – TF",
300
  "source_url": "https://huggingface.co/datasets/CZLC/cermat_czech_tf",
301
  "short_name": "Cermat Czech Language TF",
302
  "category": "General Reasoning",
303
+ "abbreviation": "CCL-TF",
304
+ "metric": "avg_mcauroc"
305
  },
306
  "benczechmark_cermat_czech_mc": {
307
  "name": "CERMAT – Czech Language – MC",
308
  "source_url": "https://huggingface.co/datasets/CZLC/cermat_czech_mc",
309
  "short_name": "Cermat Czech Language MC",
310
  "category": "General Reasoning",
311
+ "abbreviation": "CCL-MC",
312
+ "metric": "acc"
313
  },
314
  "benczechmark_cermat_czech_open": {
315
  "name": "CERMAT – Czech Language – OPEN",
316
  "source_url": "https://huggingface.co/datasets/CZLC/cermat_czech_open",
317
  "short_name": "Cermat Czech Language Open",
318
  "category": "General Reasoning",
319
+ "abbreviation": "CCL-OPEN",
320
+ "metric": "exact_match"
321
  },
322
  "benczechmark_history_ir": {
323
  "name": "Historical Relevance Grading",
324
  "source_url": "https://huggingface.co/datasets/CZLC/history_retrieval",
325
  "abbreviation": "HIST-IR",
326
  "category": "Historical",
327
+ "short_name": "Czech History IR",
328
+ "metric": "acc"
329
  },
330
  "benczechmark_agree": {
331
  "name": "Agree",
332
  "source_url": "https://huggingface.co/datasets/davidadamczyk/czechbench_agree",
333
  "abbreviation": "Agree",
334
  "category": "Syntactical Reasoning",
335
+ "short_name": "Agree",
336
+ "metric": "avg_mcauroc"
337
  },
338
  "benczechmark_belebele": {
339
  "name": "Belebele",
340
  "source_url": "https://huggingface.co/datasets/davidadamczyk/czechbench_belebele",
341
  "abbreviation": "BB",
342
  "category": "Knowledge",
343
+ "short_name": "Belebele",
344
+ "metric": "acc"
345
  },
346
  "benczechmark_czechnews": {
347
  "name": "CZ-NEWS",
348
  "source_url": "https://huggingface.co/datasets/davidadamczyk/czechbench_czech_news",
349
  "abbreviation": "CZ-NEWS",
350
  "category": "Topic Classification",
351
+ "short_name": "Czech News",
352
+ "metric": "avg_mcauroc"
353
  },
354
  "benczechmark_subjectivity": {
355
  "name": "Subjectivity",
356
  "source_url": "https://huggingface.co/datasets/davidadamczyk/czechbench_subjectivity",
357
  "abbreviation": "SUBJ",
358
  "category": "Sentiment",
359
+ "short_name": "Subjectivity",
360
+ "metric": "avg_mcauroc"
361
  },
362
  "benczechmark_essay": {
363
  "name": "Czech National Corpus – Essays",
364
  "source_url": "https://huggingface.co/datasets/CZLC/CNC_skript12",
365
  "abbreviation": "CNC-E",
366
  "category": "Language Modeling",
367
+ "short_name": "CNC – Essays",
368
+ "metric": "word_perplexity"
369
  },
370
  "benczechmark_fiction": {
371
  "name": "Czech National Corpus – Fiction",
372
  "source_url": "https://huggingface.co/datasets/CZLC/CNC_fictree",
373
  "abbreviation": "CNC-F",
374
  "category": "Language Modeling",
375
+ "short_name": "CNC – Fiction",
376
+ "metric": "word_perplexity"
377
  },
378
  "benczechmark_capek": {
379
  "name": "Czech National Corpus – Karel Čapek",
380
  "source_url": "https://huggingface.co/datasets/CZLC/CNC_Capek",
381
  "abbreviation": "CNC-CAP",
382
  "category": "Language Modeling",
383
+ "short_name": "CNC – Čapek",
384
+ "metric": "word_perplexity"
385
  },
386
  "benczechmark_correspondence": {
387
  "name": "Czech National Corpus – Correspondence",
388
  "source_url": "https://huggingface.co/datasets/CZLC/CNC_KSK",
389
  "abbreviation": "CNC-KSK",
390
  "category": "Language Modeling",
391
+ "short_name": "CNC – Correspondence",
392
+ "metric": "word_perplexity"
393
  },
394
  "benczechmark_havlicek": {
395
  "name": "Czech National Corpus – Karel Havlíček – Noviny",
396
  "source_url": "https://huggingface.co/datasets/CZLC/CNC_KHavlicek_HistNews",
397
  "abbreviation": "CNC-KH",
398
  "category": "Language Modeling",
399
+ "short_name": "CNC – KHavlicek – HistNews",
400
+ "metric": "word_perplexity"
401
  },
402
  "benczechmark_speeches": {
403
  "name": "Czech National Corpus – Speeches",
404
  "source_url": "https://huggingface.co/datasets/CZLC/CNC_PrezPrejavy",
405
  "abbreviation": "CNC-SPCH",
406
  "category": "Language Modeling",
407
+ "short_name": "CNC – Speeches",
408
+ "metric": "word_perplexity"
409
  },
410
  "benczechmark_spoken": {
411
  "name": "Czech National Corpus – Spoken",
412
  "source_url": "https://huggingface.co/datasets/CZLC/CNC_oral_ortofon",
413
  "abbreviation": "CNC-SPK",
414
  "category": "Language Modeling",
415
+ "short_name": "CNC – Spoken",
416
+ "metric": "word_perplexity"
417
  },
418
  "benczechmark_dialect": {
419
  "name": "Czech National Corpus – Dialect",
420
  "source_url": "https://huggingface.co/datasets/CZLC/CNC_Dialekt",
421
  "abbreviation": "CNC-DIAL",
422
  "category": "Language Modeling",
423
+ "short_name": "CNC – DIALEKT",
424
+ "metric": "word_perplexity"
425
  },
426
  "benczechmark_snli": {
427
  "name": "Czech SNLI",
428
  "source_url": "https://huggingface.co/datasets/CZLC/snli",
429
  "abbreviation": "SNLI",
430
  "category": "NLI",
431
+ "short_name": "Czech SNLI",
432
+ "metric": "avg_mcauroc"
433
  }
434
  }