File size: 10,480 Bytes
1fbbed1
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
{"index":14,"Rank":1,"Model":"<a target=\"_blank\" style=\"text-decoration: underline\" href=\"https:\/\/huggingface.co\/intfloat\/e5-mistral-7b-instruct\">e5-mistral-7b-instruct<\/a>","Model Size (Million Parameters)":7111,"Memory Usage (GB, fp32)":26.49,"Average":64.24,"GeoreviewClusteringP2P (rus-Cyrl)":76.32,"RuSciBenchGRNTIClusteringP2P (rus-Cyrl)":62.27,"RuSciBenchOECDClusteringP2P (rus-Cyrl)":54.13}
{"index":4,"Rank":2,"Model":"<a target=\"_blank\" style=\"text-decoration: underline\" href=\"https:\/\/huggingface.co\/GritLM\/GritLM-7B\">GritLM-7B<\/a>","Model Size (Million Parameters)":7240,"Memory Usage (GB, fp32)":26.97,"Average":61.91,"GeoreviewClusteringP2P (rus-Cyrl)":74.06,"RuSciBenchGRNTIClusteringP2P (rus-Cyrl)":60.01,"RuSciBenchOECDClusteringP2P (rus-Cyrl)":51.66}
{"index":5,"Rank":3,"Model":"<a target=\"_blank\" style=\"text-decoration: underline\" href=\"https:\/\/huggingface.co\/ai-forever\/ru-en-RoSBERTa\">ru-en-RoSBERTa<\/a>","Model Size (Million Parameters)":404,"Memory Usage (GB, fp32)":1.5,"Average":56.06,"GeoreviewClusteringP2P (rus-Cyrl)":65.42,"RuSciBenchGRNTIClusteringP2P (rus-Cyrl)":55.47,"RuSciBenchOECDClusteringP2P (rus-Cyrl)":47.29}
{"index":12,"Rank":4,"Model":"<a target=\"_blank\" style=\"text-decoration: underline\" href=\"https:\/\/huggingface.co\/deepvk\/USER-bge-m3\">USER-bge-m3<\/a>","Model Size (Million Parameters)":359,"Memory Usage (GB, fp32)":1.34,"Average":53.61,"GeoreviewClusteringP2P (rus-Cyrl)":62.79,"RuSciBenchGRNTIClusteringP2P (rus-Cyrl)":53.11,"RuSciBenchOECDClusteringP2P (rus-Cyrl)":44.93}
{"index":11,"Rank":5,"Model":"<a target=\"_blank\" style=\"text-decoration: underline\" href=\"https:\/\/huggingface.co\/deepvk\/USER-base\">USER-base<\/a>","Model Size (Million Parameters)":124,"Memory Usage (GB, fp32)":0.46,"Average":53.42,"GeoreviewClusteringP2P (rus-Cyrl)":64.16,"RuSciBenchGRNTIClusteringP2P (rus-Cyrl)":51.38,"RuSciBenchOECDClusteringP2P (rus-Cyrl)":44.73}
{"index":24,"Rank":6,"Model":"<a target=\"_blank\" style=\"text-decoration: underline\" href=\"https:\/\/huggingface.co\/sergeyzh\/LaBSE-ru-turbo\">LaBSE-ru-turbo<\/a>","Model Size (Million Parameters)":128,"Memory Usage (GB, fp32)":0.48,"Average":53.22,"GeoreviewClusteringP2P (rus-Cyrl)":64.55,"RuSciBenchGRNTIClusteringP2P (rus-Cyrl)":50.64,"RuSciBenchOECDClusteringP2P (rus-Cyrl)":44.48}
{"index":0,"Rank":7,"Model":"<a target=\"_blank\" style=\"text-decoration: underline\" href=\"https:\/\/huggingface.co\/BAAI\/bge-m3\">bge-m3<\/a>","Model Size (Million Parameters)":567,"Memory Usage (GB, fp32)":2.11,"Average":52.38,"GeoreviewClusteringP2P (rus-Cyrl)":63.09,"RuSciBenchGRNTIClusteringP2P (rus-Cyrl)":50.83,"RuSciBenchOECDClusteringP2P (rus-Cyrl)":43.21}
{"index":16,"Rank":8,"Model":"<a target=\"_blank\" style=\"text-decoration: underline\" href=\"https:\/\/huggingface.co\/intfloat\/multilingual-e5-large\">multilingual-e5-large<\/a>","Model Size (Million Parameters)":560,"Memory Usage (GB, fp32)":2.09,"Average":52.23,"GeoreviewClusteringP2P (rus-Cyrl)":59.59,"RuSciBenchGRNTIClusteringP2P (rus-Cyrl)":51.98,"RuSciBenchOECDClusteringP2P (rus-Cyrl)":45.12}
{"index":17,"Rank":9,"Model":"<a target=\"_blank\" style=\"text-decoration: underline\" href=\"https:\/\/huggingface.co\/intfloat\/multilingual-e5-small\">multilingual-e5-small<\/a>","Model Size (Million Parameters)":118,"Memory Usage (GB, fp32)":0.44,"Average":51.35,"GeoreviewClusteringP2P (rus-Cyrl)":58.57,"RuSciBenchGRNTIClusteringP2P (rus-Cyrl)":51.14,"RuSciBenchOECDClusteringP2P (rus-Cyrl)":44.33}
{"index":6,"Rank":10,"Model":"<a target=\"_blank\" style=\"text-decoration: underline\" href=\"https:\/\/huggingface.co\/ai-forever\/sbert_large_mt_nlu_ru\">sbert_large_mt_nlu_ru<\/a>","Model Size (Million Parameters)":427,"Memory Usage (GB, fp32)":1.59,"Average":51.29,"GeoreviewClusteringP2P (rus-Cyrl)":57.07,"RuSciBenchGRNTIClusteringP2P (rus-Cyrl)":51.44,"RuSciBenchOECDClusteringP2P (rus-Cyrl)":45.36}
{"index":7,"Rank":11,"Model":"<a target=\"_blank\" style=\"text-decoration: underline\" href=\"https:\/\/huggingface.co\/ai-forever\/sbert_large_nlu_ru\">sbert_large_nlu_ru<\/a>","Model Size (Million Parameters)":427,"Memory Usage (GB, fp32)":1.59,"Average":50.43,"GeoreviewClusteringP2P (rus-Cyrl)":57.12,"RuSciBenchGRNTIClusteringP2P (rus-Cyrl)":49.7,"RuSciBenchOECDClusteringP2P (rus-Cyrl)":44.48}
{"index":15,"Rank":12,"Model":"<a target=\"_blank\" style=\"text-decoration: underline\" href=\"https:\/\/huggingface.co\/intfloat\/multilingual-e5-base\">multilingual-e5-base<\/a>","Model Size (Million Parameters)":278,"Memory Usage (GB, fp32)":1.04,"Average":50.27,"GeoreviewClusteringP2P (rus-Cyrl)":54.46,"RuSciBenchGRNTIClusteringP2P (rus-Cyrl)":51.56,"RuSciBenchOECDClusteringP2P (rus-Cyrl)":44.79}
{"index":25,"Rank":13,"Model":"<a target=\"_blank\" style=\"text-decoration: underline\" href=\"https:\/\/huggingface.co\/sergeyzh\/rubert-tiny-turbo\">rubert-tiny-turbo<\/a>","Model Size (Million Parameters)":29,"Memory Usage (GB, fp32)":0.11,"Average":49.57,"GeoreviewClusteringP2P (rus-Cyrl)":59.71,"RuSciBenchGRNTIClusteringP2P (rus-Cyrl)":47.55,"RuSciBenchOECDClusteringP2P (rus-Cyrl)":41.44}
{"index":23,"Rank":14,"Model":"<a target=\"_blank\" style=\"text-decoration: underline\" href=\"https:\/\/huggingface.co\/sentence-transformers\/paraphrase-multilingual-mpnet-base-v2\">paraphrase-multilingual-mpnet-base-v2<\/a>","Model Size (Million Parameters)":278,"Memory Usage (GB, fp32)":1.04,"Average":49.18,"GeoreviewClusteringP2P (rus-Cyrl)":56.18,"RuSciBenchGRNTIClusteringP2P (rus-Cyrl)":48.47,"RuSciBenchOECDClusteringP2P (rus-Cyrl)":42.9}
{"index":22,"Rank":15,"Model":"<a target=\"_blank\" style=\"text-decoration: underline\" href=\"https:\/\/huggingface.co\/sentence-transformers\/paraphrase-multilingual-MiniLM-L12-v2\">paraphrase-multilingual-MiniLM-L12-v2<\/a>","Model Size (Million Parameters)":118,"Memory Usage (GB, fp32)":0.44,"Average":47.76,"GeoreviewClusteringP2P (rus-Cyrl)":53.37,"RuSciBenchGRNTIClusteringP2P (rus-Cyrl)":48.22,"RuSciBenchOECDClusteringP2P (rus-Cyrl)":41.68}
{"index":18,"Rank":16,"Model":"<a target=\"_blank\" style=\"text-decoration: underline\" href=\"https:\/\/huggingface.co\/sentence-transformers\/LaBSE\">LaBSE<\/a>","Model Size (Million Parameters)":471,"Memory Usage (GB, fp32)":1.75,"Average":47.74,"GeoreviewClusteringP2P (rus-Cyrl)":52.19,"RuSciBenchGRNTIClusteringP2P (rus-Cyrl)":49.07,"RuSciBenchOECDClusteringP2P (rus-Cyrl)":41.97}
{"index":8,"Rank":17,"Model":"<a target=\"_blank\" style=\"text-decoration: underline\" href=\"https:\/\/huggingface.co\/cointegrated\/LaBSE-en-ru\">LaBSE-en-ru<\/a>","Model Size (Million Parameters)":129,"Memory Usage (GB, fp32)":0.48,"Average":46.84,"GeoreviewClusteringP2P (rus-Cyrl)":51.89,"RuSciBenchGRNTIClusteringP2P (rus-Cyrl)":47.48,"RuSciBenchOECDClusteringP2P (rus-Cyrl)":41.16}
{"index":3,"Rank":18,"Model":"<a target=\"_blank\" style=\"text-decoration: underline\" href=\"https:\/\/huggingface.co\/DeepPavlov\/rubert-base-cased-sentence\">rubert-base-cased-sentence<\/a>","Model Size (Million Parameters)":180,"Memory Usage (GB, fp32)":0.67,"Average":43.13,"GeoreviewClusteringP2P (rus-Cyrl)":41.82,"RuSciBenchGRNTIClusteringP2P (rus-Cyrl)":46.29,"RuSciBenchOECDClusteringP2P (rus-Cyrl)":41.28}
{"index":13,"Rank":19,"Model":"<a target=\"_blank\" style=\"text-decoration: underline\" href=\"https:\/\/huggingface.co\/deepvk\/deberta-v1-base\">deberta-v1-base<\/a>","Model Size (Million Parameters)":124,"Memory Usage (GB, fp32)":0.46,"Average":42.92,"GeoreviewClusteringP2P (rus-Cyrl)":58.79,"RuSciBenchGRNTIClusteringP2P (rus-Cyrl)":36.66,"RuSciBenchOECDClusteringP2P (rus-Cyrl)":33.31}
{"index":10,"Rank":20,"Model":"<a target=\"_blank\" style=\"text-decoration: underline\" href=\"https:\/\/huggingface.co\/cointegrated\/rubert-tiny2\">rubert-tiny2<\/a>","Model Size (Million Parameters)":29,"Memory Usage (GB, fp32)":0.11,"Average":39.11,"GeoreviewClusteringP2P (rus-Cyrl)":41.58,"RuSciBenchGRNTIClusteringP2P (rus-Cyrl)":39.78,"RuSciBenchOECDClusteringP2P (rus-Cyrl)":35.98}
{"index":1,"Rank":21,"Model":"<a target=\"_blank\" style=\"text-decoration: underline\" href=\"https:\/\/huggingface.co\/DeepPavlov\/distilrubert-small-cased-conversational\">distilrubert-small-cased-conversational<\/a>","Model Size (Million Parameters)":106,"Memory Usage (GB, fp32)":0.39,"Average":38.41,"GeoreviewClusteringP2P (rus-Cyrl)":43.26,"RuSciBenchGRNTIClusteringP2P (rus-Cyrl)":37.84,"RuSciBenchOECDClusteringP2P (rus-Cyrl)":34.12}
{"index":9,"Rank":22,"Model":"<a target=\"_blank\" style=\"text-decoration: underline\" href=\"https:\/\/huggingface.co\/cointegrated\/rubert-tiny\">rubert-tiny<\/a>","Model Size (Million Parameters)":12,"Memory Usage (GB, fp32)":0.04,"Average":30.76,"GeoreviewClusteringP2P (rus-Cyrl)":34.4,"RuSciBenchGRNTIClusteringP2P (rus-Cyrl)":29.89,"RuSciBenchOECDClusteringP2P (rus-Cyrl)":27.98}
{"index":2,"Rank":23,"Model":"<a target=\"_blank\" style=\"text-decoration: underline\" href=\"https:\/\/huggingface.co\/DeepPavlov\/rubert-base-cased\">rubert-base-cased<\/a>","Model Size (Million Parameters)":180,"Memory Usage (GB, fp32)":0.67,"Average":27.91,"GeoreviewClusteringP2P (rus-Cyrl)":28.77,"RuSciBenchGRNTIClusteringP2P (rus-Cyrl)":28.29,"RuSciBenchOECDClusteringP2P (rus-Cyrl)":26.67}
{"index":21,"Rank":24,"Model":"<a target=\"_blank\" style=\"text-decoration: underline\" href=\"https:\/\/huggingface.co\/sentence-transformers\/all-mpnet-base-v2\">all-mpnet-base-v2<\/a>","Model Size (Million Parameters)":110,"Memory Usage (GB, fp32)":0.41,"Average":15.83,"GeoreviewClusteringP2P (rus-Cyrl)":20.33,"RuSciBenchGRNTIClusteringP2P (rus-Cyrl)":14.66,"RuSciBenchOECDClusteringP2P (rus-Cyrl)":12.49}
{"index":19,"Rank":25,"Model":"<a target=\"_blank\" style=\"text-decoration: underline\" href=\"https:\/\/huggingface.co\/sentence-transformers\/all-MiniLM-L12-v2\">all-MiniLM-L12-v2<\/a>","Model Size (Million Parameters)":33,"Memory Usage (GB, fp32)":0.12,"Average":13.78,"GeoreviewClusteringP2P (rus-Cyrl)":20.51,"RuSciBenchGRNTIClusteringP2P (rus-Cyrl)":10.65,"RuSciBenchOECDClusteringP2P (rus-Cyrl)":10.19}
{"index":20,"Rank":26,"Model":"<a target=\"_blank\" style=\"text-decoration: underline\" href=\"https:\/\/huggingface.co\/sentence-transformers\/all-MiniLM-L6-v2\">all-MiniLM-L6-v2<\/a>","Model Size (Million Parameters)":23,"Memory Usage (GB, fp32)":0.09,"Average":13.3,"GeoreviewClusteringP2P (rus-Cyrl)":20.25,"RuSciBenchGRNTIClusteringP2P (rus-Cyrl)":10.21,"RuSciBenchOECDClusteringP2P (rus-Cyrl)":9.44}