karimouda committed on
Commit
a520977
1 Parent(s): 3881202

Update README.md

Browse files

Adding MTEB results

Files changed (1) hide show
  1. README.md +533 -59
README.md CHANGED
@@ -19,77 +19,551 @@ tags:
19
  - feature-extraction
20
  - generated_from_trainer
21
  - loss:CosineSimilarityLoss
 
22
  model-index:
23
- - name: silma-embeddding-matryoshka-0.1
24
  results:
25
- - task:
26
- type: semantic-similarity
27
- name: Semantic Similarity
28
- dataset:
29
- config: ar-ar
30
- name: MTEB STS17 (ar-ar)
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
31
  revision: faeb762787bd10488a50c8b5be4a3b82e411949c
32
  split: test
33
  type: mteb/sts17-crosslingual-sts
34
  metrics:
35
- - type: pearson_cosine
36
- value: 0.8412612492708037
37
- name: Pearson Cosine
38
- - type: spearman_cosine
39
- value: 0.8424703763883515
40
- name: Spearman Cosine
41
- - type: pearson_manhattan
42
- value: 0.8118466522597414
43
- name: Pearson Manhattan
44
- - type: spearman_manhattan
45
- value: 0.8261184409962614
46
- name: Spearman Manhattan
47
- - type: pearson_euclidean
48
- value: 0.8138085140113648
49
- name: Pearson Euclidean
50
- - type: spearman_euclidean
51
- value: 0.8317403450502965
52
- name: Spearman Euclidean
53
- - type: pearson_dot
54
- value: 0.8412612546419626
55
- name: Pearson Dot
56
- - type: spearman_dot
57
- value: 0.8425077492152536
58
- name: Spearman Dot
59
- - task:
60
- type: semantic-similarity
61
- name: Semantic Similarity
62
- dataset:
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
63
  config: en-ar
64
  name: MTEB STS17 (en-ar)
65
  revision: faeb762787bd10488a50c8b5be4a3b82e411949c
66
  split: test
67
  type: mteb/sts17-crosslingual-sts
68
  metrics:
69
- - type: pearson_cosine
70
- value: 0.43375293277885835
71
- name: Pearson Cosine
72
- - type: spearman_cosine
73
- value: 0.42763149514327226
74
- name: Spearman Cosine
75
- - type: pearson_manhattan
76
- value: 0.40498576814866555
77
- name: Pearson Manhattan
78
- - type: spearman_manhattan
79
- value: 0.40636693141664754
80
- name: Spearman Manhattan
81
- - type: pearson_euclidean
82
- value: 0.39625411905897395
83
- name: Pearson Euclidean
84
- - type: spearman_euclidean
85
- value: 0.3926727199746294
86
- name: Spearman Euclidean
87
- - type: pearson_dot
88
- value: 0.4337529078998193
89
- name: Pearson Dot
90
- - type: spearman_dot
91
- value: 0.42763149514327226
92
- name: Spearman Dot
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
93
  license: apache-2.0
94
  language:
95
  - ar
 
19
  - feature-extraction
20
  - generated_from_trainer
21
  - loss:CosineSimilarityLoss
22
+ - mteb
23
  model-index:
24
+ - name: silma-ai/silma-embeddding-matryoshka-v0.1
25
  results:
26
+ - dataset:
27
+ config: ar
28
+ name: MTEB MassiveIntentClassification (ar)
29
+ revision: 4672e20407010da34463acc759c162ca9734bca6
30
+ split: test
31
+ type: mteb/amazon_massive_intent
32
+ metrics:
33
+ - type: accuracy
34
+ value: 56.445864156018835
35
+ - type: f1
36
+ value: 53.58282538318122
37
+ - type: f1_weighted
38
+ value: 56.821808211639315
39
+ - type: main_score
40
+ value: 56.445864156018835
41
+ task:
42
+ type: Classification
43
+ - dataset:
44
+ config: en
45
+ name: MTEB MassiveIntentClassification (en)
46
+ revision: 4672e20407010da34463acc759c162ca9734bca6
47
+ split: test
48
+ type: mteb/amazon_massive_intent
49
+ metrics:
50
+ - type: accuracy
51
+ value: 47.40080699394754
52
+ - type: f1
53
+ value: 44.729286773524755
54
+ - type: f1_weighted
55
+ value: 47.83506683571795
56
+ - type: main_score
57
+ value: 47.40080699394754
58
+ task:
59
+ type: Classification
60
+ - dataset:
61
+ config: ar
62
+ name: MTEB MassiveIntentClassification (ar)
63
+ revision: 4672e20407010da34463acc759c162ca9734bca6
64
+ split: validation
65
+ type: mteb/amazon_massive_intent
66
+ metrics:
67
+ - type: accuracy
68
+ value: 56.97983275946876
69
+ - type: f1
70
+ value: 53.809263807080086
71
+ - type: f1_weighted
72
+ value: 57.14993215193604
73
+ - type: main_score
74
+ value: 56.97983275946876
75
+ task:
76
+ type: Classification
77
+ - dataset:
78
+ config: en
79
+ name: MTEB MassiveIntentClassification (en)
80
+ revision: 4672e20407010da34463acc759c162ca9734bca6
81
+ split: validation
82
+ type: mteb/amazon_massive_intent
83
+ metrics:
84
+ - type: accuracy
85
+ value: 47.683226758485006
86
+ - type: f1
87
+ value: 44.905317333393775
88
+ - type: f1_weighted
89
+ value: 48.051379514830195
90
+ - type: main_score
91
+ value: 47.683226758485006
92
+ task:
93
+ type: Classification
94
+ - dataset:
95
+ config: ar
96
+ name: MTEB MassiveScenarioClassification (ar)
97
+ revision: fad2c6e8459f9e1c45d9315f4953d921437d70f8
98
+ split: test
99
+ type: mteb/amazon_massive_scenario
100
+ metrics:
101
+ - type: accuracy
102
+ value: 63.31876260928042
103
+ - type: f1
104
+ value: 63.197056314678754
105
+ - type: f1_weighted
106
+ value: 62.7166315473092
107
+ - type: main_score
108
+ value: 63.31876260928042
109
+ task:
110
+ type: Classification
111
+ - dataset:
112
+ config: en
113
+ name: MTEB MassiveScenarioClassification (en)
114
+ revision: fad2c6e8459f9e1c45d9315f4953d921437d70f8
115
+ split: test
116
+ type: mteb/amazon_massive_scenario
117
+ metrics:
118
+ - type: accuracy
119
+ value: 53.35574983187627
120
+ - type: f1
121
+ value: 50.35837223252574
122
+ - type: f1_weighted
123
+ value: 54.11644042208904
124
+ - type: main_score
125
+ value: 53.35574983187627
126
+ task:
127
+ type: Classification
128
+ - dataset:
129
+ config: ar
130
+ name: MTEB MassiveScenarioClassification (ar)
131
+ revision: fad2c6e8459f9e1c45d9315f4953d921437d70f8
132
+ split: validation
133
+ type: mteb/amazon_massive_scenario
134
+ metrics:
135
+ - type: accuracy
136
+ value: 62.26758484997541
137
+ - type: f1
138
+ value: 62.477928166560325
139
+ - type: f1_weighted
140
+ value: 61.92238394647396
141
+ - type: main_score
142
+ value: 62.26758484997541
143
+ task:
144
+ type: Classification
145
+ - dataset:
146
+ config: en
147
+ name: MTEB MassiveScenarioClassification (en)
148
+ revision: fad2c6e8459f9e1c45d9315f4953d921437d70f8
149
+ split: validation
150
+ type: mteb/amazon_massive_scenario
151
+ metrics:
152
+ - type: accuracy
153
+ value: 52.62174126906049
154
+ - type: f1
155
+ value: 50.470501485026716
156
+ - type: f1_weighted
157
+ value: 53.16459392827557
158
+ - type: main_score
159
+ value: 52.62174126906049
160
+ task:
161
+ type: Classification
162
+ - dataset:
163
+ config: en-en
164
+ name: MTEB STS17 (en-en)
165
  revision: faeb762787bd10488a50c8b5be4a3b82e411949c
166
  split: test
167
  type: mteb/sts17-crosslingual-sts
168
  metrics:
169
+ - type: cosine_pearson
170
+ value: 74.33941506827517
171
+ - type: cosine_spearman
172
+ value: 74.42197838273297
173
+ - type: euclidean_pearson
174
+ value: 75.33836191339782
175
+ - type: euclidean_spearman
176
+ value: 74.37385193453852
177
+ - type: main_score
178
+ value: 74.42197838273297
179
+ - type: manhattan_pearson
180
+ value: 75.41881517194568
181
+ - type: manhattan_spearman
182
+ value: 74.47237277057877
183
+ - type: pearson
184
+ value: 74.33941645999855
185
+ - type: spearman
186
+ value: 74.42197838273297
187
+ task:
188
+ type: STS
189
+ - dataset:
190
+ config: nl-en
191
+ name: MTEB STS17 (nl-en)
192
+ revision: faeb762787bd10488a50c8b5be4a3b82e411949c
193
+ split: test
194
+ type: mteb/sts17-crosslingual-sts
195
+ metrics:
196
+ - type: cosine_pearson
197
+ value: 31.84872826199112
198
+ - type: cosine_spearman
199
+ value: 32.22496230755917
200
+ - type: euclidean_pearson
201
+ value: 21.830860533929688
202
+ - type: euclidean_spearman
203
+ value: 21.38205815348658
204
+ - type: main_score
205
+ value: 32.22496230755917
206
+ - type: manhattan_pearson
207
+ value: 21.852430479395576
208
+ - type: manhattan_spearman
209
+ value: 21.37848326556159
210
+ - type: pearson
211
+ value: 31.84872485436001
212
+ - type: spearman
213
+ value: 32.22496230755917
214
+ task:
215
+ type: STS
216
+ - dataset:
217
  config: en-ar
218
  name: MTEB STS17 (en-ar)
219
  revision: faeb762787bd10488a50c8b5be4a3b82e411949c
220
  split: test
221
  type: mteb/sts17-crosslingual-sts
222
  metrics:
223
+ - type: cosine_pearson
224
+ value: 43.37529327788584
225
+ - type: cosine_spearman
226
+ value: 42.763149514327225
227
+ - type: euclidean_pearson
228
+ value: 39.625411905897394
229
+ - type: euclidean_spearman
230
+ value: 39.26727199746294
231
+ - type: main_score
232
+ value: 42.763149514327225
233
+ - type: manhattan_pearson
234
+ value: 40.49857681486655
235
+ - type: manhattan_spearman
236
+ value: 40.63669314166475
237
+ - type: pearson
238
+ value: 43.37529078998193
239
+ - type: spearman
240
+ value: 42.763149514327225
241
+ task:
242
+ type: STS
243
+ - dataset:
244
+ config: en-tr
245
+ name: MTEB STS17 (en-tr)
246
+ revision: faeb762787bd10488a50c8b5be4a3b82e411949c
247
+ split: test
248
+ type: mteb/sts17-crosslingual-sts
249
+ metrics:
250
+ - type: cosine_pearson
251
+ value: 17.16722415938186
252
+ - type: cosine_spearman
253
+ value: 15.590330355526344
254
+ - type: euclidean_pearson
255
+ value: 4.430499555984906
256
+ - type: euclidean_spearman
257
+ value: 2.729050802084264
258
+ - type: main_score
259
+ value: 15.590330355526344
260
+ - type: manhattan_pearson
261
+ value: 2.805408490135879
262
+ - type: manhattan_spearman
263
+ value: 1.5237347692119627
264
+ - type: pearson
265
+ value: 17.167228709176676
266
+ - type: spearman
267
+ value: 15.590330355526344
268
+ task:
269
+ type: STS
270
+ - dataset:
271
+ config: fr-en
272
+ name: MTEB STS17 (fr-en)
273
+ revision: faeb762787bd10488a50c8b5be4a3b82e411949c
274
+ split: test
275
+ type: mteb/sts17-crosslingual-sts
276
+ metrics:
277
+ - type: cosine_pearson
278
+ value: 36.093945717347395
279
+ - type: cosine_spearman
280
+ value: 37.33997345407934
281
+ - type: euclidean_pearson
282
+ value: 23.156103022485055
283
+ - type: euclidean_spearman
284
+ value: 20.62925594786342
285
+ - type: main_score
286
+ value: 37.33997345407934
287
+ - type: manhattan_pearson
288
+ value: 22.035024322719813
289
+ - type: manhattan_spearman
290
+ value: 19.147522562438795
291
+ - type: pearson
292
+ value: 36.09395175426761
293
+ - type: spearman
294
+ value: 37.33997345407934
295
+ task:
296
+ type: STS
297
+ - dataset:
298
+ config: en-de
299
+ name: MTEB STS17 (en-de)
300
+ revision: faeb762787bd10488a50c8b5be4a3b82e411949c
301
+ split: test
302
+ type: mteb/sts17-crosslingual-sts
303
+ metrics:
304
+ - type: cosine_pearson
305
+ value: 29.064411455563
306
+ - type: cosine_spearman
307
+ value: 29.232781114344697
308
+ - type: euclidean_pearson
309
+ value: 16.90458086330736
310
+ - type: euclidean_spearman
311
+ value: 17.462020565289887
312
+ - type: main_score
313
+ value: 29.232781114344697
314
+ - type: manhattan_pearson
315
+ value: 16.882446230243286
316
+ - type: manhattan_spearman
317
+ value: 17.06144091941576
318
+ - type: pearson
319
+ value: 29.06441922605839
320
+ - type: spearman
321
+ value: 29.232781114344697
322
+ task:
323
+ type: STS
324
+ - dataset:
325
+ config: es-en
326
+ name: MTEB STS17 (es-en)
327
+ revision: faeb762787bd10488a50c8b5be4a3b82e411949c
328
+ split: test
329
+ type: mteb/sts17-crosslingual-sts
330
+ metrics:
331
+ - type: cosine_pearson
332
+ value: 27.686316587339473
333
+ - type: cosine_spearman
334
+ value: 28.650995973102205
335
+ - type: euclidean_pearson
336
+ value: 12.954885279630565
337
+ - type: euclidean_spearman
338
+ value: 11.970815927480198
339
+ - type: main_score
340
+ value: 28.650995973102205
341
+ - type: manhattan_pearson
342
+ value: 12.079730127474948
343
+ - type: manhattan_spearman
344
+ value: 10.606967901984147
345
+ - type: pearson
346
+ value: 27.68631836666537
347
+ - type: spearman
348
+ value: 28.650995973102205
349
+ task:
350
+ type: STS
351
+ - dataset:
352
+ config: ar-ar
353
+ name: MTEB STS17 (ar-ar)
354
+ revision: faeb762787bd10488a50c8b5be4a3b82e411949c
355
+ split: test
356
+ type: mteb/sts17-crosslingual-sts
357
+ metrics:
358
+ - type: cosine_pearson
359
+ value: 84.12612492708037
360
+ - type: cosine_spearman
361
+ value: 84.24703763883515
362
+ - type: euclidean_pearson
363
+ value: 81.38085140113648
364
+ - type: euclidean_spearman
365
+ value: 83.17403450502965
366
+ - type: main_score
367
+ value: 84.24703763883515
368
+ - type: manhattan_pearson
369
+ value: 81.18466522597414
370
+ - type: manhattan_spearman
371
+ value: 82.61184409962614
372
+ - type: pearson
373
+ value: 84.12612546419625
374
+ - type: spearman
375
+ value: 84.25077492152536
376
+ task:
377
+ type: STS
378
+ - dataset:
379
+ config: it-en
380
+ name: MTEB STS17 (it-en)
381
+ revision: faeb762787bd10488a50c8b5be4a3b82e411949c
382
+ split: test
383
+ type: mteb/sts17-crosslingual-sts
384
+ metrics:
385
+ - type: cosine_pearson
386
+ value: 27.697680546701868
387
+ - type: cosine_spearman
388
+ value: 25.19277336255784
389
+ - type: euclidean_pearson
390
+ value: 13.964798090314115
391
+ - type: euclidean_spearman
392
+ value: 10.512169361528596
393
+ - type: main_score
394
+ value: 25.19277336255784
395
+ - type: manhattan_pearson
396
+ value: 13.537525485694433
397
+ - type: manhattan_spearman
398
+ value: 10.334001560105834
399
+ - type: pearson
400
+ value: 27.697681880242325
401
+ - type: spearman
402
+ value: 25.19277336255784
403
+ task:
404
+ type: STS
405
+ - dataset:
406
+ config: de-en
407
+ name: MTEB STS22.v2 (de-en)
408
+ revision: d31f33a128469b20e357535c39b82fb3c3f6f2bd
409
+ split: test
410
+ type: mteb/sts22-crosslingual-sts
411
+ metrics:
412
+ - type: cosine_pearson
413
+ value: 32.87548760760924
414
+ - type: cosine_spearman
415
+ value: 30.69782036694315
416
+ - type: euclidean_pearson
417
+ value: 29.925045225262142
418
+ - type: euclidean_spearman
419
+ value: 34.076021250318334
420
+ - type: main_score
421
+ value: 30.69782036694315
422
+ - type: manhattan_pearson
423
+ value: 30.815090565180945
424
+ - type: manhattan_spearman
425
+ value: 34.91615861045259
426
+ - type: pearson
427
+ value: 32.8754813614174
428
+ - type: spearman
429
+ value: 30.69782036694315
430
+ task:
431
+ type: STS
432
+ - dataset:
433
+ config: zh-en
434
+ name: MTEB STS22.v2 (zh-en)
435
+ revision: d31f33a128469b20e357535c39b82fb3c3f6f2bd
436
+ split: test
437
+ type: mteb/sts22-crosslingual-sts
438
+ metrics:
439
+ - type: cosine_pearson
440
+ value: 23.93269292232737
441
+ - type: cosine_spearman
442
+ value: 16.781461291066496
443
+ - type: euclidean_pearson
444
+ value: 20.87679825681155
445
+ - type: euclidean_spearman
446
+ value: 13.764510796592536
447
+ - type: main_score
448
+ value: 16.781461291066496
449
+ - type: manhattan_pearson
450
+ value: 23.416430850444588
451
+ - type: manhattan_spearman
452
+ value: 17.10405713909058
453
+ - type: pearson
454
+ value: 23.932682034899777
455
+ - type: spearman
456
+ value: 16.781461291066496
457
+ task:
458
+ type: STS
459
+ - dataset:
460
+ config: ar
461
+ name: MTEB STS22.v2 (ar)
462
+ revision: d31f33a128469b20e357535c39b82fb3c3f6f2bd
463
+ split: test
464
+ type: mteb/sts22-crosslingual-sts
465
+ metrics:
466
+ - type: cosine_pearson
467
+ value: 51.73784691362425
468
+ - type: cosine_spearman
469
+ value: 60.01035490847343
470
+ - type: euclidean_pearson
471
+ value: 52.717195602630305
472
+ - type: euclidean_spearman
473
+ value: 60.22164097529916
474
+ - type: main_score
475
+ value: 60.01035490847343
476
+ - type: manhattan_pearson
477
+ value: 53.04979941729716
478
+ - type: manhattan_spearman
479
+ value: 60.393100473647706
480
+ - type: pearson
481
+ value: 51.73784381247053
482
+ - type: spearman
483
+ value: 60.020906672817276
484
+ task:
485
+ type: STS
486
+ - dataset:
487
+ config: es-en
488
+ name: MTEB STS22.v2 (es-en)
489
+ revision: d31f33a128469b20e357535c39b82fb3c3f6f2bd
490
+ split: test
491
+ type: mteb/sts22-crosslingual-sts
492
+ metrics:
493
+ - type: cosine_pearson
494
+ value: 47.917244237624864
495
+ - type: cosine_spearman
496
+ value: 53.23173373821509
497
+ - type: euclidean_pearson
498
+ value: 48.172861539004636
499
+ - type: euclidean_spearman
500
+ value: 53.32970069145014
501
+ - type: main_score
502
+ value: 53.23173373821509
503
+ - type: manhattan_pearson
504
+ value: 48.163716825216646
505
+ - type: manhattan_spearman
506
+ value: 53.77963871495307
507
+ - type: pearson
508
+ value: 47.91724405724847
509
+ - type: spearman
510
+ value: 53.23173373821509
511
+ task:
512
+ type: STS
513
+ - dataset:
514
+ config: pl-en
515
+ name: MTEB STS22.v2 (pl-en)
516
+ revision: d31f33a128469b20e357535c39b82fb3c3f6f2bd
517
+ split: test
518
+ type: mteb/sts22-crosslingual-sts
519
+ metrics:
520
+ - type: cosine_pearson
521
+ value: 43.66748993183993
522
+ - type: cosine_spearman
523
+ value: 38.518248671828594
524
+ - type: euclidean_pearson
525
+ value: 50.475058499541134
526
+ - type: euclidean_spearman
527
+ value: 44.76070858743843
528
+ - type: main_score
529
+ value: 38.518248671828594
530
+ - type: manhattan_pearson
531
+ value: 50.576185727010014
532
+ - type: manhattan_spearman
533
+ value: 45.5306304403841
534
+ - type: pearson
535
+ value: 43.66750472144702
536
+ - type: spearman
537
+ value: 38.518248671828594
538
+ task:
539
+ type: STS
540
+ - dataset:
541
+ config: en
542
+ name: MTEB STS22.v2 (en)
543
+ revision: d31f33a128469b20e357535c39b82fb3c3f6f2bd
544
+ split: test
545
+ type: mteb/sts22-crosslingual-sts
546
+ metrics:
547
+ - type: cosine_pearson
548
+ value: 56.41373213565263
549
+ - type: cosine_spearman
550
+ value: 59.03774516602592
551
+ - type: euclidean_pearson
552
+ value: 54.173092638047294
553
+ - type: euclidean_spearman
554
+ value: 59.130444355085885
555
+ - type: main_score
556
+ value: 59.03774516602592
557
+ - type: manhattan_pearson
558
+ value: 54.18950361517434
559
+ - type: manhattan_spearman
560
+ value: 58.78927227383971
561
+ - type: pearson
562
+ value: 56.413733329868045
563
+ - type: spearman
564
+ value: 59.03774516602592
565
+ task:
566
+ type: STS
567
  license: apache-2.0
568
  language:
569
  - ar