Muennighoff's picture
Update
6f34120
raw
history blame
9 kB
{"index":0,"Rank":1,"Model":"<a target=\"_blank\" style=\"text-decoration: underline\" href=\"https:\/\/huggingface.co\/GritLM\/GritLM-7B\">GritLM-7B<\/a>","Model Size (Million Parameters)":7240,"Memory Usage (GB, fp32)":26.97,"Embedding Dimensions":"","Max Tokens":4096,"BornholmBitextMining":61.17}
{"index":11,"Rank":2,"Model":"<a target=\"_blank\" style=\"text-decoration: underline\" href=\"https:\/\/huggingface.co\/intfloat\/e5-mistral-7b-instruct\">e5-mistral-7b-instruct<\/a>","Model Size (Million Parameters)":7111,"Memory Usage (GB, fp32)":26.49,"Embedding Dimensions":4096,"Max Tokens":32768,"BornholmBitextMining":57.24}
{"index":15,"Rank":3,"Model":"<a target=\"_blank\" style=\"text-decoration: underline\" href=\"https:\/\/huggingface.co\/intfloat\/multilingual-e5-large-instruct\">multilingual-e5-large-instruct<\/a>","Model Size (Million Parameters)":560,"Memory Usage (GB, fp32)":2.09,"Embedding Dimensions":1024,"Max Tokens":514,"BornholmBitextMining":55.42}
{"index":8,"Rank":4,"Model":"<a target=\"_blank\" style=\"text-decoration: underline\" href=\"https:\/\/huggingface.co\/facebook\/SONAR\">SONAR<\/a>","Model Size (Million Parameters)":"","Memory Usage (GB, fp32)":"","Embedding Dimensions":"","Max Tokens":"","BornholmBitextMining":47.37}
{"index":20,"Rank":5,"Model":"<a target=\"_blank\" style=\"text-decoration: underline\" href=\"https:\/\/huggingface.co\/sentence-transformers\/LaBSE\">LaBSE<\/a>","Model Size (Million Parameters)":471,"Memory Usage (GB, fp32)":1.75,"Embedding Dimensions":768,"Max Tokens":512,"BornholmBitextMining":45.63}
{"index":16,"Rank":6,"Model":"<a target=\"_blank\" style=\"text-decoration: underline\" href=\"https:\/\/huggingface.co\/intfloat\/multilingual-e5-small\">multilingual-e5-small<\/a>","Model Size (Million Parameters)":118,"Memory Usage (GB, fp32)":0.44,"Embedding Dimensions":384,"Max Tokens":512,"BornholmBitextMining":43.89}
{"index":12,"Rank":7,"Model":"<a target=\"_blank\" style=\"text-decoration: underline\" href=\"https:\/\/huggingface.co\/intfloat\/e5-small\">e5-small<\/a>","Model Size (Million Parameters)":33,"Memory Usage (GB, fp32)":0.12,"Embedding Dimensions":384,"Max Tokens":512,"BornholmBitextMining":40.27}
{"index":10,"Rank":8,"Model":"<a target=\"_blank\" style=\"text-decoration: underline\" href=\"https:\/\/huggingface.co\/intfloat\/e5-large\">e5-large<\/a>","Model Size (Million Parameters)":335,"Memory Usage (GB, fp32)":1.25,"Embedding Dimensions":1024,"Max Tokens":512,"BornholmBitextMining":40.15}
{"index":9,"Rank":9,"Model":"<a target=\"_blank\" style=\"text-decoration: underline\" href=\"https:\/\/huggingface.co\/intfloat\/e5-base\">e5-base<\/a>","Model Size (Million Parameters)":110,"Memory Usage (GB, fp32)":0.41,"Embedding Dimensions":768,"Max Tokens":512,"BornholmBitextMining":40.09}
{"index":1,"Rank":10,"Model":"<a target=\"_blank\" style=\"text-decoration: underline\" href=\"https:\/\/huggingface.co\/Jechto\/e5-dansk-test-0.1\">e5-dansk-test-0.1<\/a>","Model Size (Million Parameters)":560,"Memory Usage (GB, fp32)":2.09,"Embedding Dimensions":1024,"Max Tokens":514,"BornholmBitextMining":37.97}
{"index":21,"Rank":11,"Model":"<a target=\"_blank\" style=\"text-decoration: underline\" href=\"https:\/\/huggingface.co\/sentence-transformers\/all-MiniLM-L12-v2\">all-MiniLM-L12-v2<\/a>","Model Size (Million Parameters)":33,"Memory Usage (GB, fp32)":0.12,"Embedding Dimensions":384,"Max Tokens":512,"BornholmBitextMining":35.25}
{"index":13,"Rank":12,"Model":"<a target=\"_blank\" style=\"text-decoration: underline\" href=\"https:\/\/huggingface.co\/intfloat\/multilingual-e5-base\">multilingual-e5-base<\/a>","Model Size (Million Parameters)":278,"Memory Usage (GB, fp32)":1.04,"Embedding Dimensions":768,"Max Tokens":514,"BornholmBitextMining":33.22}
{"index":14,"Rank":13,"Model":"<a target=\"_blank\" style=\"text-decoration: underline\" href=\"https:\/\/huggingface.co\/intfloat\/multilingual-e5-large\">multilingual-e5-large<\/a>","Model Size (Million Parameters)":560,"Memory Usage (GB, fp32)":2.09,"Embedding Dimensions":1024,"Max Tokens":514,"BornholmBitextMining":29.87}
{"index":22,"Rank":14,"Model":"<a target=\"_blank\" style=\"text-decoration: underline\" href=\"https:\/\/huggingface.co\/sentence-transformers\/all-MiniLM-L6-v2\">all-MiniLM-L6-v2<\/a>","Model Size (Million Parameters)":23,"Memory Usage (GB, fp32)":0.09,"Embedding Dimensions":384,"Max Tokens":512,"BornholmBitextMining":29.68}
{"index":23,"Rank":15,"Model":"<a target=\"_blank\" style=\"text-decoration: underline\" href=\"https:\/\/huggingface.co\/sentence-transformers\/all-mpnet-base-v2\">all-mpnet-base-v2<\/a>","Model Size (Million Parameters)":110,"Memory Usage (GB, fp32)":0.41,"Embedding Dimensions":768,"Max Tokens":514,"BornholmBitextMining":27.44}
{"index":24,"Rank":16,"Model":"<a target=\"_blank\" style=\"text-decoration: underline\" href=\"https:\/\/huggingface.co\/sentence-transformers\/paraphrase-multilingual-MiniLM-L12-v2\">paraphrase-multilingual-MiniLM-L12-v2<\/a>","Model Size (Million Parameters)":118,"Memory Usage (GB, fp32)":0.44,"Embedding Dimensions":384,"Max Tokens":512,"BornholmBitextMining":19.67}
{"index":25,"Rank":17,"Model":"<a target=\"_blank\" style=\"text-decoration: underline\" href=\"https:\/\/huggingface.co\/sentence-transformers\/paraphrase-multilingual-mpnet-base-v2\">paraphrase-multilingual-mpnet-base-v2<\/a>","Model Size (Million Parameters)":278,"Memory Usage (GB, fp32)":1.04,"Embedding Dimensions":768,"Max Tokens":514,"BornholmBitextMining":18.18}
{"index":4,"Rank":18,"Model":"<a target=\"_blank\" style=\"text-decoration: underline\" href=\"https:\/\/huggingface.co\/KBLab\/sentence-bert-swedish-cased\">sentence-bert-swedish-cased<\/a>","Model Size (Million Parameters)":125,"Memory Usage (GB, fp32)":0.47,"Embedding Dimensions":768,"Max Tokens":512,"BornholmBitextMining":14.08}
{"index":7,"Rank":19,"Model":"<a target=\"_blank\" style=\"text-decoration: underline\" href=\"https:\/\/huggingface.co\/chcaa\/dfm-encoder-large-v1\">dfm-encoder-large-v1<\/a>","Model Size (Million Parameters)":355,"Memory Usage (GB, fp32)":1.32,"Embedding Dimensions":1024,"Max Tokens":512,"BornholmBitextMining":11.65}
{"index":5,"Rank":20,"Model":"<a target=\"_blank\" style=\"text-decoration: underline\" href=\"https:\/\/huggingface.co\/NbAiLab\/nb-bert-base\">nb-bert-base<\/a>","Model Size (Million Parameters)":179,"Memory Usage (GB, fp32)":0.67,"Embedding Dimensions":768,"Max Tokens":512,"BornholmBitextMining":9.88}
{"index":2,"Rank":21,"Model":"<a target=\"_blank\" style=\"text-decoration: underline\" href=\"https:\/\/huggingface.co\/KB\/bert-base-swedish-cased\">bert-base-swedish-cased<\/a>","Model Size (Million Parameters)":125,"Memory Usage (GB, fp32)":0.47,"Embedding Dimensions":768,"Max Tokens":512,"BornholmBitextMining":6.6}
{"index":26,"Rank":22,"Model":"<a target=\"_blank\" style=\"text-decoration: underline\" href=\"https:\/\/huggingface.co\/vesteinn\/DanskBERT\">DanskBERT<\/a>","Model Size (Million Parameters)":125,"Memory Usage (GB, fp32)":0.47,"Embedding Dimensions":768,"Max Tokens":514,"BornholmBitextMining":6.34}
{"index":18,"Rank":23,"Model":"<a target=\"_blank\" style=\"text-decoration: underline\" href=\"https:\/\/huggingface.co\/ltg\/norbert3-base\">norbert3-base<\/a>","Model Size (Million Parameters)":131,"Memory Usage (GB, fp32)":0.49,"Embedding Dimensions":768,"Max Tokens":512,"BornholmBitextMining":6.08}
{"index":6,"Rank":24,"Model":"<a target=\"_blank\" style=\"text-decoration: underline\" href=\"https:\/\/huggingface.co\/NbAiLab\/nb-bert-large\">nb-bert-large<\/a>","Model Size (Million Parameters)":355,"Memory Usage (GB, fp32)":1.32,"Embedding Dimensions":1024,"Max Tokens":512,"BornholmBitextMining":4.53}
{"index":27,"Rank":25,"Model":"<a target=\"_blank\" style=\"text-decoration: underline\" href=\"https:\/\/huggingface.co\/xlm-roberta-base\">xlm-roberta-base<\/a>","Model Size (Million Parameters)":279,"Memory Usage (GB, fp32)":1.04,"Embedding Dimensions":768,"Max Tokens":514,"BornholmBitextMining":4.42}
{"index":19,"Rank":26,"Model":"<a target=\"_blank\" style=\"text-decoration: underline\" href=\"https:\/\/huggingface.co\/ltg\/norbert3-large\">norbert3-large<\/a>","Model Size (Million Parameters)":368,"Memory Usage (GB, fp32)":1.37,"Embedding Dimensions":1024,"Max Tokens":512,"BornholmBitextMining":2.9}
{"index":17,"Rank":27,"Model":"<a target=\"_blank\" style=\"text-decoration: underline\" href=\"https:\/\/huggingface.co\/jonfd\/electra-small-nordic\">electra-small-nordic<\/a>","Model Size (Million Parameters)":23,"Memory Usage (GB, fp32)":0.09,"Embedding Dimensions":256,"Max Tokens":512,"BornholmBitextMining":1.44}
{"index":3,"Rank":28,"Model":"<a target=\"_blank\" style=\"text-decoration: underline\" href=\"https:\/\/huggingface.co\/KBLab\/electra-small-swedish-cased-discriminator\">electra-small-swedish-cased-discriminator<\/a>","Model Size (Million Parameters)":16,"Memory Usage (GB, fp32)":0.06,"Embedding Dimensions":256,"Max Tokens":512,"BornholmBitextMining":0.85}