orionweller commited on
Commit
d51bafc
1 Parent(s): 71544e2

Automated Leaderboard Update

Browse files
all_data_tasks/4/default.jsonl CHANGED
The diff for this file is too large to render. See raw diff
 
boards_data/en/data_overall/default.jsonl CHANGED
@@ -187,7 +187,7 @@
187
  {"index":93,"Rank":198,"Model":"<a target=\"_blank\" style=\"text-decoration: underline\" href=\"https:\/\/huggingface.co\/Pekarnick\/e5-large-v2-Q4_K_M-GGUF\">e5-large-v2-Q4_K_M-GGUF<\/a>","Model Size (Million Parameters)":"","Memory Usage (GB, fp32)":"","Embedding Dimensions":"","Max Tokens":"","Average (56 datasets)":"","Classification Average (12 datasets)":75.24,"Clustering Average (11 datasets)":44.49,"PairClassification Average (3 datasets)":86.03,"Reranking Average (4 datasets)":56.61,"Retrieval Average (15 datasets)":"","STS Average (10 datasets)":82.05,"Summarization Average (1 datasets)":30.19}
188
  {"index":97,"Rank":200,"Model":"<a target=\"_blank\" style=\"text-decoration: underline\" href=\"https:\/\/huggingface.co\/Shimin\/LLaMA-embeeding\">LLaMA-embeeding<\/a>","Model Size (Million Parameters)":"","Memory Usage (GB, fp32)":"","Embedding Dimensions":"","Max Tokens":"","Average (56 datasets)":"","Classification Average (12 datasets)":"","Clustering Average (11 datasets)":"","PairClassification Average (3 datasets)":"","Reranking Average (4 datasets)":"","Retrieval Average (15 datasets)":"","STS Average (10 datasets)":"","Summarization Average (1 datasets)":30.62}
189
  {"index":98,"Rank":201,"Model":"<a target=\"_blank\" style=\"text-decoration: underline\" href=\"https:\/\/huggingface.co\/Shimin\/yiyouliao\">yiyouliao<\/a>","Model Size (Million Parameters)":"","Memory Usage (GB, fp32)":"","Embedding Dimensions":"","Max Tokens":"","Average (56 datasets)":"","Classification Average (12 datasets)":"","Clustering Average (11 datasets)":"","PairClassification Average (3 datasets)":79.84,"Reranking Average (4 datasets)":"","Retrieval Average (15 datasets)":"","STS Average (10 datasets)":"","Summarization Average (1 datasets)":32.47}
190
- {"index":102,"Rank":202,"Model":"<a target=\"_blank\" style=\"text-decoration: underline\" href=\"https:\/\/huggingface.co\/Snowflake\/snowflake-arctic-embed-m-v1.5\">snowflake-arctic-embed-m-v1.5<\/a>","Model Size (Million Parameters)":109,"Memory Usage (GB, fp32)":0.41,"Embedding Dimensions":768,"Max Tokens":512,"Average (56 datasets)":"","Classification Average (12 datasets)":"","Clustering Average (11 datasets)":"","PairClassification Average (3 datasets)":"","Reranking Average (4 datasets)":"","Retrieval Average (15 datasets)":"","STS Average (10 datasets)":"","Summarization Average (1 datasets)":""}
191
  {"index":109,"Rank":203,"Model":"<a target=\"_blank\" style=\"text-decoration: underline\" href=\"https:\/\/huggingface.co\/Wissam42\/sentence-croissant-llm-base\">sentence-croissant-llm-base<\/a>","Model Size (Million Parameters)":1280,"Memory Usage (GB, fp32)":4.77,"Embedding Dimensions":2048,"Max Tokens":2048,"Average (56 datasets)":"","Classification Average (12 datasets)":"","Clustering Average (11 datasets)":"","PairClassification Average (3 datasets)":"","Reranking Average (4 datasets)":"","Retrieval Average (15 datasets)":"","STS Average (10 datasets)":"","Summarization Average (1 datasets)":""}
192
  {"index":110,"Rank":204,"Model":"<a target=\"_blank\" style=\"text-decoration: underline\" href=\"https:\/\/huggingface.co\/aari1995\/German_Semantic_STS_V2\">German_Semantic_STS_V2<\/a>","Model Size (Million Parameters)":336,"Memory Usage (GB, fp32)":1.25,"Embedding Dimensions":1024,"Max Tokens":512,"Average (56 datasets)":"","Classification Average (12 datasets)":"","Clustering Average (11 datasets)":"","PairClassification Average (3 datasets)":"","Reranking Average (4 datasets)":"","Retrieval Average (15 datasets)":"","STS Average (10 datasets)":"","Summarization Average (1 datasets)":""}
193
  {"index":111,"Rank":205,"Model":"<a target=\"_blank\" style=\"text-decoration: underline\" href=\"https:\/\/huggingface.co\/agier9\/UAE-Large-V1-Q5_K_S-GGUF\">UAE-Large-V1-Q5_K_S-GGUF<\/a>","Model Size (Million Parameters)":"","Memory Usage (GB, fp32)":"","Embedding Dimensions":"","Max Tokens":"","Average (56 datasets)":"","Classification Average (12 datasets)":75.58,"Clustering Average (11 datasets)":46.73,"PairClassification Average (3 datasets)":87.25,"Reranking Average (4 datasets)":59.88,"Retrieval Average (15 datasets)":"","STS Average (10 datasets)":84.54,"Summarization Average (1 datasets)":32.03}
 
187
  {"index":93,"Rank":198,"Model":"<a target=\"_blank\" style=\"text-decoration: underline\" href=\"https:\/\/huggingface.co\/Pekarnick\/e5-large-v2-Q4_K_M-GGUF\">e5-large-v2-Q4_K_M-GGUF<\/a>","Model Size (Million Parameters)":"","Memory Usage (GB, fp32)":"","Embedding Dimensions":"","Max Tokens":"","Average (56 datasets)":"","Classification Average (12 datasets)":75.24,"Clustering Average (11 datasets)":44.49,"PairClassification Average (3 datasets)":86.03,"Reranking Average (4 datasets)":56.61,"Retrieval Average (15 datasets)":"","STS Average (10 datasets)":82.05,"Summarization Average (1 datasets)":30.19}
188
  {"index":97,"Rank":200,"Model":"<a target=\"_blank\" style=\"text-decoration: underline\" href=\"https:\/\/huggingface.co\/Shimin\/LLaMA-embeeding\">LLaMA-embeeding<\/a>","Model Size (Million Parameters)":"","Memory Usage (GB, fp32)":"","Embedding Dimensions":"","Max Tokens":"","Average (56 datasets)":"","Classification Average (12 datasets)":"","Clustering Average (11 datasets)":"","PairClassification Average (3 datasets)":"","Reranking Average (4 datasets)":"","Retrieval Average (15 datasets)":"","STS Average (10 datasets)":"","Summarization Average (1 datasets)":30.62}
189
  {"index":98,"Rank":201,"Model":"<a target=\"_blank\" style=\"text-decoration: underline\" href=\"https:\/\/huggingface.co\/Shimin\/yiyouliao\">yiyouliao<\/a>","Model Size (Million Parameters)":"","Memory Usage (GB, fp32)":"","Embedding Dimensions":"","Max Tokens":"","Average (56 datasets)":"","Classification Average (12 datasets)":"","Clustering Average (11 datasets)":"","PairClassification Average (3 datasets)":79.84,"Reranking Average (4 datasets)":"","Retrieval Average (15 datasets)":"","STS Average (10 datasets)":"","Summarization Average (1 datasets)":32.47}
190
+ {"index":102,"Rank":202,"Model":"<a target=\"_blank\" style=\"text-decoration: underline\" href=\"https:\/\/huggingface.co\/Snowflake\/snowflake-arctic-embed-m-v1.5\">snowflake-arctic-embed-m-v1.5<\/a>","Model Size (Million Parameters)":109,"Memory Usage (GB, fp32)":0.41,"Embedding Dimensions":768,"Max Tokens":512,"Average (56 datasets)":"","Classification Average (12 datasets)":"","Clustering Average (11 datasets)":"","PairClassification Average (3 datasets)":"","Reranking Average (4 datasets)":"","Retrieval Average (15 datasets)":55.14,"STS Average (10 datasets)":"","Summarization Average (1 datasets)":""}
191
  {"index":109,"Rank":203,"Model":"<a target=\"_blank\" style=\"text-decoration: underline\" href=\"https:\/\/huggingface.co\/Wissam42\/sentence-croissant-llm-base\">sentence-croissant-llm-base<\/a>","Model Size (Million Parameters)":1280,"Memory Usage (GB, fp32)":4.77,"Embedding Dimensions":2048,"Max Tokens":2048,"Average (56 datasets)":"","Classification Average (12 datasets)":"","Clustering Average (11 datasets)":"","PairClassification Average (3 datasets)":"","Reranking Average (4 datasets)":"","Retrieval Average (15 datasets)":"","STS Average (10 datasets)":"","Summarization Average (1 datasets)":""}
192
  {"index":110,"Rank":204,"Model":"<a target=\"_blank\" style=\"text-decoration: underline\" href=\"https:\/\/huggingface.co\/aari1995\/German_Semantic_STS_V2\">German_Semantic_STS_V2<\/a>","Model Size (Million Parameters)":336,"Memory Usage (GB, fp32)":1.25,"Embedding Dimensions":1024,"Max Tokens":512,"Average (56 datasets)":"","Classification Average (12 datasets)":"","Clustering Average (11 datasets)":"","PairClassification Average (3 datasets)":"","Reranking Average (4 datasets)":"","Retrieval Average (15 datasets)":"","STS Average (10 datasets)":"","Summarization Average (1 datasets)":""}
193
  {"index":111,"Rank":205,"Model":"<a target=\"_blank\" style=\"text-decoration: underline\" href=\"https:\/\/huggingface.co\/agier9\/UAE-Large-V1-Q5_K_S-GGUF\">UAE-Large-V1-Q5_K_S-GGUF<\/a>","Model Size (Million Parameters)":"","Memory Usage (GB, fp32)":"","Embedding Dimensions":"","Max Tokens":"","Average (56 datasets)":"","Classification Average (12 datasets)":75.58,"Clustering Average (11 datasets)":46.73,"PairClassification Average (3 datasets)":87.25,"Reranking Average (4 datasets)":59.88,"Retrieval Average (15 datasets)":"","STS Average (10 datasets)":84.54,"Summarization Average (1 datasets)":32.03}
boards_data/en/data_tasks/Retrieval/default.jsonl CHANGED
The diff for this file is too large to render. See raw diff