Muennighoff commited on
Commit
f45efd6
1 Parent(s): 16a0ce7

Add RAR-b LB

Browse files
EXTERNAL_MODEL_RESULTS.json CHANGED
The diff for this file is too large to render. See raw diff
 
all_data_tasks/0/default.jsonl CHANGED
@@ -1,14 +1,29 @@
1
- {"index":4,"Rank":1,"Model":"<a target=\"_blank\" style=\"text-decoration: underline\" href=\"https:\/\/huggingface.co\/Alibaba-NLP\/gte-Qwen2-7B-instruct\">gte-Qwen2-7B-instruct<\/a>","Model Size (Million Parameters)":7613,"Memory Usage (GB, fp32)":"28.36","Average":22.38,"BrightRetrieval (aops)":15.1,"BrightRetrieval (biology)":32.09,"BrightRetrieval (earth_science)":40.66,"BrightRetrieval (economics)":16.18,"BrightRetrieval (leetcode)":31.07,"BrightRetrieval (pony)":1.25,"BrightRetrieval (psychology)":26.58,"BrightRetrieval (robotics)":12.82,"BrightRetrieval (stackoverflow)":13.95,"BrightRetrieval (sustainable_living)":20.82,"BrightRetrieval (theoremqa_questions)":29.9,"BrightRetrieval (theoremqa_theorems)":28.15}
2
- {"index":3,"Rank":2,"Model":"<a target=\"_blank\" style=\"text-decoration: underline\" href=\"https:\/\/huggingface.co\/Alibaba-NLP\/gte-Qwen1.5-7B-instruct\">gte-Qwen1.5-7B-instruct<\/a>","Model Size (Million Parameters)":7099,"Memory Usage (GB, fp32)":"26.45","Average":21.75,"BrightRetrieval (aops)":14.36,"BrightRetrieval (biology)":30.92,"BrightRetrieval (earth_science)":36.22,"BrightRetrieval (economics)":17.72,"BrightRetrieval (leetcode)":25.46,"BrightRetrieval (pony)":9.79,"BrightRetrieval (psychology)":24.61,"BrightRetrieval (robotics)":13.47,"BrightRetrieval (stackoverflow)":19.85,"BrightRetrieval (sustainable_living)":14.93,"BrightRetrieval (theoremqa_questions)":26.97,"BrightRetrieval (theoremqa_theorems)":26.66}
3
- {"index":7,"Rank":3,"Model":"<a target=\"_blank\" style=\"text-decoration: underline\" href=\"https:\/\/huggingface.co\/GritLM\/GritLM-7B\">GritLM-7B<\/a>","Model Size (Million Parameters)":7240,"Memory Usage (GB, fp32)":"26.97","Average":20.43,"BrightRetrieval (aops)":8.91,"BrightRetrieval (biology)":25.04,"BrightRetrieval (earth_science)":32.77,"BrightRetrieval (economics)":19.0,"BrightRetrieval (leetcode)":29.85,"BrightRetrieval (pony)":21.98,"BrightRetrieval (psychology)":19.92,"BrightRetrieval (robotics)":17.31,"BrightRetrieval (stackoverflow)":11.62,"BrightRetrieval (sustainable_living)":18.04,"BrightRetrieval (theoremqa_questions)":23.34,"BrightRetrieval (theoremqa_theorems)":17.41}
4
- {"index":0,"Rank":4,"Model":"<a target=\"_blank\" style=\"text-decoration: underline\" href=\"https:\/\/cloud.google.com\/vertex-ai\/generative-ai\/docs\/embeddings\/get-text-embeddings#latest_models\">google-gecko.text-embedding-preview-0409<\/a>","Model Size (Million Parameters)":1200,"Memory Usage (GB, fp32)":"4.47","Average":19.73,"BrightRetrieval (aops)":9.33,"BrightRetrieval (biology)":22.98,"BrightRetrieval (earth_science)":34.38,"BrightRetrieval (economics)":19.5,"BrightRetrieval (leetcode)":29.64,"BrightRetrieval (pony)":3.59,"BrightRetrieval (psychology)":27.86,"BrightRetrieval (robotics)":15.98,"BrightRetrieval (stackoverflow)":17.93,"BrightRetrieval (sustainable_living)":17.25,"BrightRetrieval (theoremqa_questions)":21.51,"BrightRetrieval (theoremqa_theorems)":16.77}
5
- {"index":10,"Rank":5,"Model":"<a target=\"_blank\" style=\"text-decoration: underline\" href=\"https:\/\/huggingface.co\/hkunlp\/instructor-xl\">instructor-xl<\/a>","Model Size (Million Parameters)":1241,"Memory Usage (GB, fp32)":"4.62","Average":18.64,"BrightRetrieval (aops)":8.26,"BrightRetrieval (biology)":21.91,"BrightRetrieval (earth_science)":34.35,"BrightRetrieval (economics)":22.81,"BrightRetrieval (leetcode)":27.5,"BrightRetrieval (pony)":5.02,"BrightRetrieval (psychology)":27.43,"BrightRetrieval (robotics)":17.39,"BrightRetrieval (stackoverflow)":19.06,"BrightRetrieval (sustainable_living)":18.82,"BrightRetrieval (theoremqa_questions)":14.59,"BrightRetrieval (theoremqa_theorems)":6.5}
6
- {"index":8,"Rank":6,"Model":"<a target=\"_blank\" style=\"text-decoration: underline\" href=\"https:\/\/huggingface.co\/Salesforce\/SFR-Embedding-Mistral\">SFR-Embedding-Mistral<\/a>","Model Size (Million Parameters)":7111,"Memory Usage (GB, fp32)":"26.49","Average":18.0,"BrightRetrieval (aops)":7.43,"BrightRetrieval (biology)":19.49,"BrightRetrieval (earth_science)":26.63,"BrightRetrieval (economics)":17.84,"BrightRetrieval (leetcode)":27.35,"BrightRetrieval (pony)":1.97,"BrightRetrieval (psychology)":18.97,"BrightRetrieval (robotics)":16.7,"BrightRetrieval (stackoverflow)":12.72,"BrightRetrieval (sustainable_living)":19.79,"BrightRetrieval (theoremqa_questions)":23.05,"BrightRetrieval (theoremqa_theorems)":24.05}
7
- {"index":1,"Rank":7,"Model":"<a target=\"_blank\" style=\"text-decoration: underline\" href=\"https:\/\/docs.voyageai.com\/embeddings\/\">voyage-large-2-instruct<\/a>","Model Size (Million Parameters)":"","Memory Usage (GB, fp32)":"","Average":17.57,"BrightRetrieval (aops)":7.45,"BrightRetrieval (biology)":23.55,"BrightRetrieval (earth_science)":25.09,"BrightRetrieval (economics)":19.85,"BrightRetrieval (leetcode)":30.6,"BrightRetrieval (pony)":1.48,"BrightRetrieval (psychology)":24.79,"BrightRetrieval (robotics)":11.21,"BrightRetrieval (stackoverflow)":15.03,"BrightRetrieval (sustainable_living)":15.58,"BrightRetrieval (theoremqa_questions)":26.06,"BrightRetrieval (theoremqa_theorems)":10.13}
8
- {"index":13,"Rank":8,"Model":"<a target=\"_blank\" style=\"text-decoration: underline\" href=\"https:\/\/openai.com\/blog\/new-embedding-models-and-api-updates\">text-embedding-3-large<\/a>","Model Size (Million Parameters)":"","Memory Usage (GB, fp32)":"","Average":17.43,"BrightRetrieval (aops)":8.45,"BrightRetrieval (biology)":23.67,"BrightRetrieval (earth_science)":26.27,"BrightRetrieval (economics)":19.98,"BrightRetrieval (leetcode)":23.65,"BrightRetrieval (pony)":2.45,"BrightRetrieval (psychology)":27.52,"BrightRetrieval (robotics)":12.93,"BrightRetrieval (stackoverflow)":12.49,"BrightRetrieval (sustainable_living)":20.32,"BrightRetrieval (theoremqa_questions)":22.22,"BrightRetrieval (theoremqa_theorems)":9.25}
9
- {"index":11,"Rank":9,"Model":"<a target=\"_blank\" style=\"text-decoration: underline\" href=\"https:\/\/huggingface.co\/intfloat\/e5-mistral-7b-instruct\">e5-mistral-7b-instruct<\/a>","Model Size (Million Parameters)":7111,"Memory Usage (GB, fp32)":"26.49","Average":17.43,"BrightRetrieval (aops)":7.1,"BrightRetrieval (biology)":18.84,"BrightRetrieval (earth_science)":25.96,"BrightRetrieval (economics)":15.49,"BrightRetrieval (leetcode)":28.72,"BrightRetrieval (pony)":4.81,"BrightRetrieval (psychology)":15.79,"BrightRetrieval (robotics)":16.37,"BrightRetrieval (stackoverflow)":9.83,"BrightRetrieval (sustainable_living)":18.51,"BrightRetrieval (theoremqa_questions)":23.94,"BrightRetrieval (theoremqa_theorems)":23.78}
10
- {"index":6,"Rank":10,"Model":"<a target=\"_blank\" style=\"text-decoration: underline\" href=\"https:\/\/huggingface.co\/Cohere\/Cohere-embed-english-v3.0\">Cohere-embed-english-v3.0<\/a>","Model Size (Million Parameters)":"","Memory Usage (GB, fp32)":"","Average":16.24,"BrightRetrieval (aops)":6.46,"BrightRetrieval (biology)":18.98,"BrightRetrieval (earth_science)":27.45,"BrightRetrieval (economics)":20.18,"BrightRetrieval (leetcode)":26.78,"BrightRetrieval (pony)":1.77,"BrightRetrieval (psychology)":21.82,"BrightRetrieval (robotics)":16.21,"BrightRetrieval (stackoverflow)":16.47,"BrightRetrieval (sustainable_living)":17.69,"BrightRetrieval (theoremqa_questions)":15.07,"BrightRetrieval (theoremqa_theorems)":6.04}
11
- {"index":12,"Rank":11,"Model":"<a target=\"_blank\" style=\"text-decoration: underline\" href=\"https:\/\/huggingface.co\/sentence-transformers\/all-mpnet-base-v2\">all-mpnet-base-v2<\/a>","Model Size (Million Parameters)":110,"Memory Usage (GB, fp32)":"0.41","Average":14.8,"BrightRetrieval (aops)":5.32,"BrightRetrieval (biology)":15.52,"BrightRetrieval (earth_science)":20.11,"BrightRetrieval (economics)":16.64,"BrightRetrieval (leetcode)":26.4,"BrightRetrieval (pony)":6.95,"BrightRetrieval (psychology)":22.63,"BrightRetrieval (robotics)":8.36,"BrightRetrieval (stackoverflow)":9.48,"BrightRetrieval (sustainable_living)":15.34,"BrightRetrieval (theoremqa_questions)":18.49,"BrightRetrieval (theoremqa_theorems)":12.38}
12
- {"index":2,"Rank":12,"Model":"<a target=\"_blank\" style=\"text-decoration: underline\" href=\"https:\/\/en.wikipedia.org\/wiki\/Okapi_BM25\">bm25<\/a>","Model Size (Million Parameters)":"","Memory Usage (GB, fp32)":"","Average":14.29,"BrightRetrieval (aops)":6.2,"BrightRetrieval (biology)":19.19,"BrightRetrieval (earth_science)":27.06,"BrightRetrieval (economics)":14.87,"BrightRetrieval (leetcode)":24.37,"BrightRetrieval (pony)":7.93,"BrightRetrieval (psychology)":12.51,"BrightRetrieval (robotics)":13.53,"BrightRetrieval (stackoverflow)":16.55,"BrightRetrieval (sustainable_living)":15.22,"BrightRetrieval (theoremqa_questions)":9.78,"BrightRetrieval (theoremqa_theorems)":4.25}
13
- {"index":9,"Rank":13,"Model":"<a target=\"_blank\" style=\"text-decoration: underline\" href=\"https:\/\/huggingface.co\/hkunlp\/instructor-large\">instructor-large<\/a>","Model Size (Million Parameters)":335,"Memory Usage (GB, fp32)":"1.25","Average":14.12,"BrightRetrieval (aops)":7.94,"BrightRetrieval (biology)":15.61,"BrightRetrieval (earth_science)":21.52,"BrightRetrieval (economics)":15.99,"BrightRetrieval (leetcode)":20.0,"BrightRetrieval (pony)":1.32,"BrightRetrieval (psychology)":21.94,"BrightRetrieval (robotics)":11.45,"BrightRetrieval (stackoverflow)":11.21,"BrightRetrieval (sustainable_living)":13.16,"BrightRetrieval (theoremqa_questions)":20.07,"BrightRetrieval (theoremqa_theorems)":9.29}
14
- {"index":5,"Rank":14,"Model":"<a target=\"_blank\" style=\"text-decoration: underline\" href=\"https:\/\/huggingface.co\/BAAI\/bge-large-en-v1.5\">bge-large-en-v1.5<\/a>","Model Size (Million Parameters)":"","Memory Usage (GB, fp32)":"","Average":13.47,"BrightRetrieval (aops)":6.08,"BrightRetrieval (biology)":11.96,"BrightRetrieval (earth_science)":24.15,"BrightRetrieval (economics)":16.59,"BrightRetrieval (leetcode)":26.68,"BrightRetrieval (pony)":5.64,"BrightRetrieval (psychology)":17.44,"BrightRetrieval (robotics)":12.21,"BrightRetrieval (stackoverflow)":9.51,"BrightRetrieval (sustainable_living)":13.27,"BrightRetrieval (theoremqa_questions)":12.56,"BrightRetrieval (theoremqa_theorems)":5.51}
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {"index":13,"Rank":1,"Model":"<a target=\"_blank\" style=\"text-decoration: underline\" href=\"https:\/\/huggingface.co\/GritLM\/GritLM-7B\">GritLM-7B<\/a>","Model Size (Million Parameters)":7240,"Memory Usage (GB, fp32)":26.97,"Average":35.2,"ARCChallenge":26.68,"AlphaNLI":34.0,"HellaSwag":39.45,"PIQA":44.35,"Quail":11.69,"RARbCode":84.0,"RARbMath":82.35,"SIQA":7.23,"SpartQA":9.29,"TempReasonL1":7.15,"TempReasonL2Fact":58.38,"TempReasonL2Pure":11.22,"TempReasonL3Fact":44.29,"TempReasonL3Pure":14.15,"WinoGrande":53.74}
2
+ {"index":25,"Rank":2,"Model":"<a target=\"_blank\" style=\"text-decoration: underline\" href=\"https:\/\/openai.com\/blog\/new-embedding-models-and-api-updates\">text-embedding-3-large-instruct<\/a>","Model Size (Million Parameters)":"","Memory Usage (GB, fp32)":"","Average":31.13,"ARCChallenge":21.22,"AlphaNLI":34.23,"HellaSwag":31.4,"PIQA":37.52,"Quail":13.6,"RARbCode":89.41,"RARbMath":87.73,"SIQA":4.99,"SpartQA":7.45,"TempReasonL1":2.07,"TempReasonL2Fact":39.77,"TempReasonL2Pure":11.04,"TempReasonL3Fact":37.04,"TempReasonL3Pure":15.51,"WinoGrande":33.92}
3
+ {"index":12,"Rank":3,"Model":"<a target=\"_blank\" style=\"text-decoration: underline\" href=\"https:\/\/huggingface.co\/GritLM\/GritLM-7B\">GritLM-7B-noinstruct<\/a>","Model Size (Million Parameters)":7240,"Memory Usage (GB, fp32)":26.97,"Average":30.57,"ARCChallenge":16.57,"AlphaNLI":29.56,"HellaSwag":36.03,"PIQA":35.8,"Quail":8.68,"RARbCode":83.14,"RARbMath":83.01,"SIQA":5.73,"SpartQA":1.56,"TempReasonL1":2.57,"TempReasonL2Fact":48.25,"TempReasonL2Pure":8.98,"TempReasonL3Fact":34.11,"TempReasonL3Pure":12.44,"WinoGrande":52.12}
4
+ {"index":26,"Rank":4,"Model":"<a target=\"_blank\" style=\"text-decoration: underline\" href=\"https:\/\/openai.com\/blog\/new-embedding-models-and-api-updates\">text-embedding-3-large<\/a>","Model Size (Million Parameters)":"","Memory Usage (GB, fp32)":"","Average":29.95,"ARCChallenge":23.98,"AlphaNLI":37.27,"HellaSwag":34.12,"PIQA":41.96,"Quail":10.15,"RARbCode":89.64,"RARbMath":90.08,"SIQA":3.44,"SpartQA":7.51,"TempReasonL1":2.13,"TempReasonL2Fact":28.65,"TempReasonL2Pure":10.34,"TempReasonL3Fact":25.52,"TempReasonL3Pure":15.28,"WinoGrande":29.11}
5
+ {"index":16,"Rank":5,"Model":"<a target=\"_blank\" style=\"text-decoration: underline\" href=\"https:\/\/huggingface.co\/intfloat\/e5-mistral-7b-instruct\">e5-mistral-7b-instruct<\/a>","Model Size (Million Parameters)":7111,"Memory Usage (GB, fp32)":26.49,"Average":28.41,"ARCChallenge":17.81,"AlphaNLI":26.12,"HellaSwag":34.85,"PIQA":39.37,"Quail":7.01,"RARbCode":78.46,"RARbMath":72.16,"SIQA":5.42,"SpartQA":9.92,"TempReasonL1":3.31,"TempReasonL2Fact":36.9,"TempReasonL2Pure":9.18,"TempReasonL3Fact":30.18,"TempReasonL3Pure":14.31,"WinoGrande":41.21}
6
+ {"index":17,"Rank":6,"Model":"<a target=\"_blank\" style=\"text-decoration: underline\" href=\"https:\/\/huggingface.co\/intfloat\/e5-mistral-7b-instruct-noinstruct\">e5-mistral-7b-instruct-noinstruct<\/a>","Model Size (Million Parameters)":7111,"Memory Usage (GB, fp32)":26.49,"Average":28.04,"ARCChallenge":20.48,"AlphaNLI":18.88,"HellaSwag":32.25,"PIQA":32.8,"Quail":6.25,"RARbCode":79.84,"RARbMath":76.19,"SIQA":5.08,"SpartQA":10.87,"TempReasonL1":3.04,"TempReasonL2Fact":35.63,"TempReasonL2Pure":9.32,"TempReasonL3Fact":30.41,"TempReasonL3Pure":14.39,"WinoGrande":45.18}
7
+ {"index":10,"Rank":7,"Model":"<a target=\"_blank\" style=\"text-decoration: underline\" href=\"https:\/\/huggingface.co\/Cohere\/Cohere-embed-english-v3.0\">Cohere-embed-english-v3.0-instruct<\/a>","Model Size (Million Parameters)":"","Memory Usage (GB, fp32)":"","Average":25.41,"ARCChallenge":10.1,"AlphaNLI":18.75,"HellaSwag":29.02,"PIQA":27.89,"Quail":7.77,"RARbCode":56.56,"RARbMath":72.05,"SIQA":5.03,"SpartQA":3.33,"TempReasonL1":1.43,"TempReasonL2Fact":40.46,"TempReasonL2Pure":2.39,"TempReasonL3Fact":33.87,"TempReasonL3Pure":7.52,"WinoGrande":65.02}
8
+ {"index":28,"Rank":8,"Model":"<a target=\"_blank\" style=\"text-decoration: underline\" href=\"https:\/\/openai.com\/blog\/new-embedding-models-and-api-updates\">text-embedding-3-small<\/a>","Model Size (Million Parameters)":"","Memory Usage (GB, fp32)":"","Average":24.2,"ARCChallenge":14.63,"AlphaNLI":30.61,"HellaSwag":30.94,"PIQA":33.69,"Quail":6.11,"RARbCode":72.03,"RARbMath":71.07,"SIQA":3.03,"SpartQA":6.63,"TempReasonL1":2.35,"TempReasonL2Fact":25.68,"TempReasonL2Pure":2.76,"TempReasonL3Fact":22.09,"TempReasonL3Pure":9.79,"WinoGrande":31.53}
9
+ {"index":11,"Rank":9,"Model":"<a target=\"_blank\" style=\"text-decoration: underline\" href=\"https:\/\/huggingface.co\/Cohere\/Cohere-embed-english-v3.0\">Cohere-embed-english-v3.0<\/a>","Model Size (Million Parameters)":"","Memory Usage (GB, fp32)":"","Average":23.65,"ARCChallenge":9.89,"AlphaNLI":15.1,"HellaSwag":26.35,"PIQA":28.49,"Quail":4.1,"RARbCode":57.19,"RARbMath":72.26,"SIQA":4.26,"SpartQA":3.75,"TempReasonL1":1.5,"TempReasonL2Fact":35.91,"TempReasonL2Pure":1.89,"TempReasonL3Fact":27.51,"TempReasonL3Pure":8.53,"WinoGrande":58.01}
10
+ {"index":24,"Rank":10,"Model":"<a target=\"_blank\" style=\"text-decoration: underline\" href=\"https:\/\/openai.com\/blog\/new-and-improved-embedding-model\">text-embedding-ada-002<\/a>","Model Size (Million Parameters)":"","Memory Usage (GB, fp32)":"","Average":22.57,"ARCChallenge":13.3,"AlphaNLI":25.65,"HellaSwag":29.29,"PIQA":31.02,"Quail":5.83,"RARbCode":83.39,"RARbMath":73.21,"SIQA":3.14,"SpartQA":4.23,"TempReasonL1":1.68,"TempReasonL2Fact":19.93,"TempReasonL2Pure":2.6,"TempReasonL3Fact":18.02,"TempReasonL3Pure":7.58,"WinoGrande":19.65}
11
+ {"index":27,"Rank":11,"Model":"<a target=\"_blank\" style=\"text-decoration: underline\" href=\"https:\/\/openai.com\/blog\/new-embedding-models-and-api-updates\">text-embedding-3-small-instruct<\/a>","Model Size (Million Parameters)":"","Memory Usage (GB, fp32)":"","Average":22.09,"ARCChallenge":13.76,"AlphaNLI":21.14,"HellaSwag":27.2,"PIQA":29.59,"Quail":6.64,"RARbCode":72.14,"RARbMath":64.31,"SIQA":2.98,"SpartQA":3.58,"TempReasonL1":2.29,"TempReasonL2Fact":26.34,"TempReasonL2Pure":3.17,"TempReasonL3Fact":22.72,"TempReasonL3Pure":9.98,"WinoGrande":25.49}
12
+ {"index":7,"Rank":12,"Model":"<a target=\"_blank\" style=\"text-decoration: underline\" href=\"https:\/\/huggingface.co\/BAAI\/bge-m3\">bge-m3<\/a>","Model Size (Million Parameters)":2270,"Memory Usage (GB, fp32)":8.46,"Average":21.48,"ARCChallenge":9.02,"AlphaNLI":24.73,"HellaSwag":25.67,"PIQA":22.93,"Quail":7.51,"RARbCode":38.8,"RARbMath":69.19,"SIQA":4.89,"SpartQA":7.49,"TempReasonL1":0.99,"TempReasonL2Fact":33.23,"TempReasonL2Pure":0.68,"TempReasonL3Fact":30.05,"TempReasonL3Pure":5.28,"WinoGrande":41.72}
13
+ {"index":6,"Rank":13,"Model":"<a target=\"_blank\" style=\"text-decoration: underline\" href=\"https:\/\/huggingface.co\/BAAI\/bge-m3\">bge-m3-instruct<\/a>","Model Size (Million Parameters)":2270,"Memory Usage (GB, fp32)":8.46,"Average":20.83,"ARCChallenge":9.03,"AlphaNLI":24.69,"HellaSwag":25.55,"PIQA":19.03,"Quail":7.08,"RARbCode":39.58,"RARbMath":64.51,"SIQA":4.77,"SpartQA":7.0,"TempReasonL1":0.8,"TempReasonL2Fact":34.99,"TempReasonL2Pure":0.62,"TempReasonL3Fact":32.47,"TempReasonL3Pure":7.01,"WinoGrande":35.33}
14
+ {"index":20,"Rank":14,"Model":"<a target=\"_blank\" style=\"text-decoration: underline\" href=\"https:\/\/huggingface.co\/sentence-transformers\/all-MiniLM-L6-v2\">all-MiniLM-L6-v2<\/a>","Model Size (Million Parameters)":23,"Memory Usage (GB, fp32)":0.09,"Average":19.61,"ARCChallenge":9.48,"AlphaNLI":28.19,"HellaSwag":24.21,"PIQA":25.28,"Quail":3.92,"RARbCode":44.27,"RARbMath":68.19,"SIQA":1.56,"SpartQA":1.65,"TempReasonL1":1.53,"TempReasonL2Fact":17.65,"TempReasonL2Pure":0.46,"TempReasonL3Fact":14.16,"TempReasonL3Pure":6.33,"WinoGrande":47.33}
15
+ {"index":23,"Rank":15,"Model":"<a target=\"_blank\" style=\"text-decoration: underline\" href=\"https:\/\/openai.com\/blog\/new-and-improved-embedding-model\">text-embedding-ada-002-instruct<\/a>","Model Size (Million Parameters)":"","Memory Usage (GB, fp32)":"","Average":19.56,"ARCChallenge":11.85,"AlphaNLI":10.62,"HellaSwag":24.8,"PIQA":23.87,"Quail":5.79,"RARbCode":82.36,"RARbMath":67.26,"SIQA":2.64,"SpartQA":4.75,"TempReasonL1":1.44,"TempReasonL2Fact":19.38,"TempReasonL2Pure":2.43,"TempReasonL3Fact":17.58,"TempReasonL3Pure":7.31,"WinoGrande":11.36}
16
+ {"index":1,"Rank":16,"Model":"<a target=\"_blank\" style=\"text-decoration: underline\" href=\"https:\/\/github.com\/facebookresearch\/dpr-scale\/tree\/main\/dragon\">dragon-plus<\/a>","Model Size (Million Parameters)":438,"Memory Usage (GB, fp32)":1.63,"Average":19.1,"ARCChallenge":8.91,"AlphaNLI":32.1,"HellaSwag":27.69,"PIQA":28.01,"Quail":4.09,"RARbCode":17.58,"RARbMath":45.09,"SIQA":2.0,"SpartQA":10.34,"TempReasonL1":1.82,"TempReasonL2Fact":17.45,"TempReasonL2Pure":0.55,"TempReasonL3Fact":15.71,"TempReasonL3Pure":7.97,"WinoGrande":67.18}
17
+ {"index":22,"Rank":17,"Model":"<a target=\"_blank\" style=\"text-decoration: underline\" href=\"https:\/\/huggingface.co\/sentence-transformers\/all-mpnet-base-v2\">all-mpnet-base-v2<\/a>","Model Size (Million Parameters)":110,"Memory Usage (GB, fp32)":0.41,"Average":18.03,"ARCChallenge":11.8,"AlphaNLI":22.41,"HellaSwag":26.27,"PIQA":29.03,"Quail":3.41,"RARbCode":53.21,"RARbMath":71.85,"SIQA":2.38,"SpartQA":0.22,"TempReasonL1":1.77,"TempReasonL2Fact":11.2,"TempReasonL2Pure":1.15,"TempReasonL3Fact":9.42,"TempReasonL3Pure":5.59,"WinoGrande":20.8}
18
+ {"index":5,"Rank":18,"Model":"<a target=\"_blank\" style=\"text-decoration: underline\" href=\"https:\/\/huggingface.co\/BAAI\/bge-large-en-v1.5\">bge-large-en-v1.5<\/a>","Model Size (Million Parameters)":1340,"Memory Usage (GB, fp32)":4.99,"Average":17.7,"ARCChallenge":9.99,"AlphaNLI":13.13,"HellaSwag":28.5,"PIQA":27.99,"Quail":1.83,"RARbCode":48.12,"RARbMath":57.36,"SIQA":1.04,"SpartQA":2.99,"TempReasonL1":1.46,"TempReasonL2Fact":24.25,"TempReasonL2Pure":2.35,"TempReasonL3Fact":20.64,"TempReasonL3Pure":6.67,"WinoGrande":19.18}
19
+ {"index":18,"Rank":19,"Model":"<a target=\"_blank\" style=\"text-decoration: underline\" href=\"https:\/\/huggingface.co\/sentence-transformers\/all-MiniLM-L12-v2\">all-MiniLM-L12-v2<\/a>","Model Size (Million Parameters)":33,"Memory Usage (GB, fp32)":0.12,"Average":17.35,"ARCChallenge":10.23,"AlphaNLI":25.35,"HellaSwag":24.08,"PIQA":26.44,"Quail":3.08,"RARbCode":42.44,"RARbMath":66.36,"SIQA":2.09,"SpartQA":2.67,"TempReasonL1":1.66,"TempReasonL2Fact":10.31,"TempReasonL2Pure":0.63,"TempReasonL3Fact":11.11,"TempReasonL3Pure":6.63,"WinoGrande":27.2}
20
+ {"index":0,"Rank":20,"Model":"<a target=\"_blank\" style=\"text-decoration: underline\" href=\"https:\/\/github.com\/facebookresearch\/dpr-scale\/tree\/main\/dragon\">dragon-plus-instruct<\/a>","Model Size (Million Parameters)":438,"Memory Usage (GB, fp32)":1.63,"Average":16.73,"ARCChallenge":8.24,"AlphaNLI":25.18,"HellaSwag":24.06,"PIQA":26.35,"Quail":4.2,"RARbCode":12.84,"RARbMath":36.15,"SIQA":1.75,"SpartQA":10.82,"TempReasonL1":1.54,"TempReasonL2Fact":16.11,"TempReasonL2Pure":0.57,"TempReasonL3Fact":14.81,"TempReasonL3Pure":7.46,"WinoGrande":60.84}
21
+ {"index":19,"Rank":21,"Model":"<a target=\"_blank\" style=\"text-decoration: underline\" href=\"https:\/\/huggingface.co\/sentence-transformers\/all-MiniLM-L6-v2\">all-MiniLM-L6-v2-instruct<\/a>","Model Size (Million Parameters)":23,"Memory Usage (GB, fp32)":0.09,"Average":15.95,"ARCChallenge":9.4,"AlphaNLI":15.09,"HellaSwag":20.51,"PIQA":24.68,"Quail":3.46,"RARbCode":42.47,"RARbMath":62.39,"SIQA":1.53,"SpartQA":0.57,"TempReasonL1":1.05,"TempReasonL2Fact":16.57,"TempReasonL2Pure":0.49,"TempReasonL3Fact":14.01,"TempReasonL3Pure":6.27,"WinoGrande":20.73}
22
+ {"index":15,"Rank":22,"Model":"<a target=\"_blank\" style=\"text-decoration: underline\" href=\"https:\/\/huggingface.co\/facebook\/contriever\">contriever<\/a>","Model Size (Million Parameters)":438,"Memory Usage (GB, fp32)":1.63,"Average":15.86,"ARCChallenge":8.62,"AlphaNLI":31.77,"HellaSwag":14.42,"PIQA":24.64,"Quail":4.97,"RARbCode":9.28,"RARbMath":30.76,"SIQA":1.27,"SpartQA":10.94,"TempReasonL1":1.93,"TempReasonL2Fact":22.68,"TempReasonL2Pure":1.12,"TempReasonL3Fact":20.62,"TempReasonL3Pure":7.8,"WinoGrande":47.15}
23
+ {"index":3,"Rank":23,"Model":"<a target=\"_blank\" style=\"text-decoration: underline\" href=\"https:\/\/huggingface.co\/BAAI\/bge-base-en-v1.5\">bge-base-en-v1.5<\/a>","Model Size (Million Parameters)":438,"Memory Usage (GB, fp32)":1.63,"Average":14.93,"ARCChallenge":9.66,"AlphaNLI":10.99,"HellaSwag":26.64,"PIQA":25.69,"Quail":1.42,"RARbCode":46.47,"RARbMath":46.86,"SIQA":0.94,"SpartQA":3.37,"TempReasonL1":1.07,"TempReasonL2Fact":17.23,"TempReasonL2Pure":1.29,"TempReasonL3Fact":13.36,"TempReasonL3Pure":5.2,"WinoGrande":13.76}
24
+ {"index":4,"Rank":24,"Model":"<a target=\"_blank\" style=\"text-decoration: underline\" href=\"https:\/\/huggingface.co\/BAAI\/bge-large-en-v1.5\">bge-large-en-v1.5-instruct<\/a>","Model Size (Million Parameters)":1340,"Memory Usage (GB, fp32)":4.99,"Average":14.55,"ARCChallenge":8.86,"AlphaNLI":0.86,"HellaSwag":26.24,"PIQA":23.26,"Quail":2.72,"RARbCode":45.25,"RARbMath":49.82,"SIQA":0.59,"SpartQA":2.34,"TempReasonL1":1.17,"TempReasonL2Fact":21.19,"TempReasonL2Pure":2.1,"TempReasonL3Fact":17.59,"TempReasonL3Pure":5.99,"WinoGrande":10.31}
25
+ {"index":9,"Rank":25,"Model":"<a target=\"_blank\" style=\"text-decoration: underline\" href=\"https:\/\/huggingface.co\/BAAI\/bge-small-en-v1.5\">bge-small-en-v1.5<\/a>","Model Size (Million Parameters)":24,"Memory Usage (GB, fp32)":0.09,"Average":14.15,"ARCChallenge":8.95,"AlphaNLI":11.64,"HellaSwag":25.44,"PIQA":23.92,"Quail":1.75,"RARbCode":42.36,"RARbMath":44.98,"SIQA":0.77,"SpartQA":3.55,"TempReasonL1":1.41,"TempReasonL2Fact":17.56,"TempReasonL2Pure":1.05,"TempReasonL3Fact":13.88,"TempReasonL3Pure":4.76,"WinoGrande":10.28}
26
+ {"index":21,"Rank":26,"Model":"<a target=\"_blank\" style=\"text-decoration: underline\" href=\"https:\/\/huggingface.co\/sentence-transformers\/all-mpnet-base-v2\">all-mpnet-base-v2-instruct<\/a>","Model Size (Million Parameters)":110,"Memory Usage (GB, fp32)":0.41,"Average":13.84,"ARCChallenge":10.35,"AlphaNLI":1.96,"HellaSwag":13.01,"PIQA":27.18,"Quail":3.02,"RARbCode":48.95,"RARbMath":69.21,"SIQA":1.29,"SpartQA":1.01,"TempReasonL1":1.52,"TempReasonL2Fact":7.28,"TempReasonL2Pure":1.03,"TempReasonL3Fact":7.03,"TempReasonL3Pure":5.16,"WinoGrande":9.66}
27
+ {"index":2,"Rank":27,"Model":"<a target=\"_blank\" style=\"text-decoration: underline\" href=\"https:\/\/huggingface.co\/BAAI\/bge-base-en-v1.5\">bge-base-en-v1.5-instruct<\/a>","Model Size (Million Parameters)":438,"Memory Usage (GB, fp32)":1.63,"Average":13.52,"ARCChallenge":8.85,"AlphaNLI":4.13,"HellaSwag":24.03,"PIQA":23.03,"Quail":1.25,"RARbCode":46.32,"RARbMath":45.62,"SIQA":0.24,"SpartQA":2.67,"TempReasonL1":0.8,"TempReasonL2Fact":16.56,"TempReasonL2Pure":1.33,"TempReasonL3Fact":12.68,"TempReasonL3Pure":5.08,"WinoGrande":10.27}
28
+ {"index":8,"Rank":28,"Model":"<a target=\"_blank\" style=\"text-decoration: underline\" href=\"https:\/\/huggingface.co\/BAAI\/bge-small-en-v1.5\">bge-small-en-v1.5-instruct<\/a>","Model Size (Million Parameters)":24,"Memory Usage (GB, fp32)":0.09,"Average":12.6,"ARCChallenge":7.72,"AlphaNLI":1.26,"HellaSwag":23.41,"PIQA":20.79,"Quail":2.01,"RARbCode":41.52,"RARbMath":46.5,"SIQA":0.98,"SpartQA":2.86,"TempReasonL1":1.27,"TempReasonL2Fact":16.72,"TempReasonL2Pure":1.1,"TempReasonL3Fact":12.81,"TempReasonL3Pure":4.63,"WinoGrande":5.35}
29
+ {"index":14,"Rank":29,"Model":"<a target=\"_blank\" style=\"text-decoration: underline\" href=\"https:\/\/huggingface.co\/facebook\/contriever\">contriever-instruct<\/a>","Model Size (Million Parameters)":438,"Memory Usage (GB, fp32)":1.63,"Average":"","ARCChallenge":7.63,"AlphaNLI":27.09,"HellaSwag":"","PIQA":21.73,"Quail":4.92,"RARbCode":7.12,"RARbMath":21.83,"SIQA":0.88,"SpartQA":10.56,"TempReasonL1":1.8,"TempReasonL2Fact":22.03,"TempReasonL2Pure":0.94,"TempReasonL3Fact":20.82,"TempReasonL3Pure":7.15,"WinoGrande":26.3}
app.py CHANGED
The diff for this file is too large to render. See raw diff
 
boards_data/rar-b/data_overall/default.txt ADDED
File without changes
boards_data/rar-b/data_tasks/Retrieval/default.jsonl ADDED
@@ -0,0 +1,29 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {"index":13,"Rank":1,"Model":"<a target=\"_blank\" style=\"text-decoration: underline\" href=\"https:\/\/huggingface.co\/GritLM\/GritLM-7B\">GritLM-7B<\/a>","Model Size (Million Parameters)":7240,"Memory Usage (GB, fp32)":26.97,"Average":35.2,"ARCChallenge":26.68,"AlphaNLI":34.0,"HellaSwag":39.45,"PIQA":44.35,"Quail":11.69,"RARbCode":84.0,"RARbMath":82.35,"SIQA":7.23,"SpartQA":9.29,"TempReasonL1":7.15,"TempReasonL2Fact":58.38,"TempReasonL2Pure":11.22,"TempReasonL3Fact":44.29,"TempReasonL3Pure":14.15,"WinoGrande":53.74}
2
+ {"index":25,"Rank":2,"Model":"<a target=\"_blank\" style=\"text-decoration: underline\" href=\"https:\/\/openai.com\/blog\/new-embedding-models-and-api-updates\">text-embedding-3-large-instruct<\/a>","Model Size (Million Parameters)":"","Memory Usage (GB, fp32)":"","Average":31.13,"ARCChallenge":21.22,"AlphaNLI":34.23,"HellaSwag":31.4,"PIQA":37.52,"Quail":13.6,"RARbCode":89.41,"RARbMath":87.73,"SIQA":4.99,"SpartQA":7.45,"TempReasonL1":2.07,"TempReasonL2Fact":39.77,"TempReasonL2Pure":11.04,"TempReasonL3Fact":37.04,"TempReasonL3Pure":15.51,"WinoGrande":33.92}
3
+ {"index":12,"Rank":3,"Model":"<a target=\"_blank\" style=\"text-decoration: underline\" href=\"https:\/\/huggingface.co\/GritLM\/GritLM-7B\">GritLM-7B-noinstruct<\/a>","Model Size (Million Parameters)":7240,"Memory Usage (GB, fp32)":26.97,"Average":30.57,"ARCChallenge":16.57,"AlphaNLI":29.56,"HellaSwag":36.03,"PIQA":35.8,"Quail":8.68,"RARbCode":83.14,"RARbMath":83.01,"SIQA":5.73,"SpartQA":1.56,"TempReasonL1":2.57,"TempReasonL2Fact":48.25,"TempReasonL2Pure":8.98,"TempReasonL3Fact":34.11,"TempReasonL3Pure":12.44,"WinoGrande":52.12}
4
+ {"index":26,"Rank":4,"Model":"<a target=\"_blank\" style=\"text-decoration: underline\" href=\"https:\/\/openai.com\/blog\/new-embedding-models-and-api-updates\">text-embedding-3-large<\/a>","Model Size (Million Parameters)":"","Memory Usage (GB, fp32)":"","Average":29.95,"ARCChallenge":23.98,"AlphaNLI":37.27,"HellaSwag":34.12,"PIQA":41.96,"Quail":10.15,"RARbCode":89.64,"RARbMath":90.08,"SIQA":3.44,"SpartQA":7.51,"TempReasonL1":2.13,"TempReasonL2Fact":28.65,"TempReasonL2Pure":10.34,"TempReasonL3Fact":25.52,"TempReasonL3Pure":15.28,"WinoGrande":29.11}
5
+ {"index":16,"Rank":5,"Model":"<a target=\"_blank\" style=\"text-decoration: underline\" href=\"https:\/\/huggingface.co\/intfloat\/e5-mistral-7b-instruct\">e5-mistral-7b-instruct<\/a>","Model Size (Million Parameters)":7111,"Memory Usage (GB, fp32)":26.49,"Average":28.41,"ARCChallenge":17.81,"AlphaNLI":26.12,"HellaSwag":34.85,"PIQA":39.37,"Quail":7.01,"RARbCode":78.46,"RARbMath":72.16,"SIQA":5.42,"SpartQA":9.92,"TempReasonL1":3.31,"TempReasonL2Fact":36.9,"TempReasonL2Pure":9.18,"TempReasonL3Fact":30.18,"TempReasonL3Pure":14.31,"WinoGrande":41.21}
6
+ {"index":17,"Rank":6,"Model":"<a target=\"_blank\" style=\"text-decoration: underline\" href=\"https:\/\/huggingface.co\/intfloat\/e5-mistral-7b-instruct-noinstruct\">e5-mistral-7b-instruct-noinstruct<\/a>","Model Size (Million Parameters)":7111,"Memory Usage (GB, fp32)":26.49,"Average":28.04,"ARCChallenge":20.48,"AlphaNLI":18.88,"HellaSwag":32.25,"PIQA":32.8,"Quail":6.25,"RARbCode":79.84,"RARbMath":76.19,"SIQA":5.08,"SpartQA":10.87,"TempReasonL1":3.04,"TempReasonL2Fact":35.63,"TempReasonL2Pure":9.32,"TempReasonL3Fact":30.41,"TempReasonL3Pure":14.39,"WinoGrande":45.18}
7
+ {"index":10,"Rank":7,"Model":"<a target=\"_blank\" style=\"text-decoration: underline\" href=\"https:\/\/huggingface.co\/Cohere\/Cohere-embed-english-v3.0\">Cohere-embed-english-v3.0-instruct<\/a>","Model Size (Million Parameters)":"","Memory Usage (GB, fp32)":"","Average":25.41,"ARCChallenge":10.1,"AlphaNLI":18.75,"HellaSwag":29.02,"PIQA":27.89,"Quail":7.77,"RARbCode":56.56,"RARbMath":72.05,"SIQA":5.03,"SpartQA":3.33,"TempReasonL1":1.43,"TempReasonL2Fact":40.46,"TempReasonL2Pure":2.39,"TempReasonL3Fact":33.87,"TempReasonL3Pure":7.52,"WinoGrande":65.02}
8
+ {"index":28,"Rank":8,"Model":"<a target=\"_blank\" style=\"text-decoration: underline\" href=\"https:\/\/openai.com\/blog\/new-embedding-models-and-api-updates\">text-embedding-3-small<\/a>","Model Size (Million Parameters)":"","Memory Usage (GB, fp32)":"","Average":24.2,"ARCChallenge":14.63,"AlphaNLI":30.61,"HellaSwag":30.94,"PIQA":33.69,"Quail":6.11,"RARbCode":72.03,"RARbMath":71.07,"SIQA":3.03,"SpartQA":6.63,"TempReasonL1":2.35,"TempReasonL2Fact":25.68,"TempReasonL2Pure":2.76,"TempReasonL3Fact":22.09,"TempReasonL3Pure":9.79,"WinoGrande":31.53}
9
+ {"index":11,"Rank":9,"Model":"<a target=\"_blank\" style=\"text-decoration: underline\" href=\"https:\/\/huggingface.co\/Cohere\/Cohere-embed-english-v3.0\">Cohere-embed-english-v3.0<\/a>","Model Size (Million Parameters)":"","Memory Usage (GB, fp32)":"","Average":23.65,"ARCChallenge":9.89,"AlphaNLI":15.1,"HellaSwag":26.35,"PIQA":28.49,"Quail":4.1,"RARbCode":57.19,"RARbMath":72.26,"SIQA":4.26,"SpartQA":3.75,"TempReasonL1":1.5,"TempReasonL2Fact":35.91,"TempReasonL2Pure":1.89,"TempReasonL3Fact":27.51,"TempReasonL3Pure":8.53,"WinoGrande":58.01}
10
+ {"index":24,"Rank":10,"Model":"<a target=\"_blank\" style=\"text-decoration: underline\" href=\"https:\/\/openai.com\/blog\/new-and-improved-embedding-model\">text-embedding-ada-002<\/a>","Model Size (Million Parameters)":"","Memory Usage (GB, fp32)":"","Average":22.57,"ARCChallenge":13.3,"AlphaNLI":25.65,"HellaSwag":29.29,"PIQA":31.02,"Quail":5.83,"RARbCode":83.39,"RARbMath":73.21,"SIQA":3.14,"SpartQA":4.23,"TempReasonL1":1.68,"TempReasonL2Fact":19.93,"TempReasonL2Pure":2.6,"TempReasonL3Fact":18.02,"TempReasonL3Pure":7.58,"WinoGrande":19.65}
11
+ {"index":27,"Rank":11,"Model":"<a target=\"_blank\" style=\"text-decoration: underline\" href=\"https:\/\/openai.com\/blog\/new-embedding-models-and-api-updates\">text-embedding-3-small-instruct<\/a>","Model Size (Million Parameters)":"","Memory Usage (GB, fp32)":"","Average":22.09,"ARCChallenge":13.76,"AlphaNLI":21.14,"HellaSwag":27.2,"PIQA":29.59,"Quail":6.64,"RARbCode":72.14,"RARbMath":64.31,"SIQA":2.98,"SpartQA":3.58,"TempReasonL1":2.29,"TempReasonL2Fact":26.34,"TempReasonL2Pure":3.17,"TempReasonL3Fact":22.72,"TempReasonL3Pure":9.98,"WinoGrande":25.49}
12
+ {"index":7,"Rank":12,"Model":"<a target=\"_blank\" style=\"text-decoration: underline\" href=\"https:\/\/huggingface.co\/BAAI\/bge-m3\">bge-m3<\/a>","Model Size (Million Parameters)":2270,"Memory Usage (GB, fp32)":8.46,"Average":21.48,"ARCChallenge":9.02,"AlphaNLI":24.73,"HellaSwag":25.67,"PIQA":22.93,"Quail":7.51,"RARbCode":38.8,"RARbMath":69.19,"SIQA":4.89,"SpartQA":7.49,"TempReasonL1":0.99,"TempReasonL2Fact":33.23,"TempReasonL2Pure":0.68,"TempReasonL3Fact":30.05,"TempReasonL3Pure":5.28,"WinoGrande":41.72}
13
+ {"index":6,"Rank":13,"Model":"<a target=\"_blank\" style=\"text-decoration: underline\" href=\"https:\/\/huggingface.co\/BAAI\/bge-m3\">bge-m3-instruct<\/a>","Model Size (Million Parameters)":2270,"Memory Usage (GB, fp32)":8.46,"Average":20.83,"ARCChallenge":9.03,"AlphaNLI":24.69,"HellaSwag":25.55,"PIQA":19.03,"Quail":7.08,"RARbCode":39.58,"RARbMath":64.51,"SIQA":4.77,"SpartQA":7.0,"TempReasonL1":0.8,"TempReasonL2Fact":34.99,"TempReasonL2Pure":0.62,"TempReasonL3Fact":32.47,"TempReasonL3Pure":7.01,"WinoGrande":35.33}
14
+ {"index":20,"Rank":14,"Model":"<a target=\"_blank\" style=\"text-decoration: underline\" href=\"https:\/\/huggingface.co\/sentence-transformers\/all-MiniLM-L6-v2\">all-MiniLM-L6-v2<\/a>","Model Size (Million Parameters)":23,"Memory Usage (GB, fp32)":0.09,"Average":19.61,"ARCChallenge":9.48,"AlphaNLI":28.19,"HellaSwag":24.21,"PIQA":25.28,"Quail":3.92,"RARbCode":44.27,"RARbMath":68.19,"SIQA":1.56,"SpartQA":1.65,"TempReasonL1":1.53,"TempReasonL2Fact":17.65,"TempReasonL2Pure":0.46,"TempReasonL3Fact":14.16,"TempReasonL3Pure":6.33,"WinoGrande":47.33}
15
+ {"index":23,"Rank":15,"Model":"<a target=\"_blank\" style=\"text-decoration: underline\" href=\"https:\/\/openai.com\/blog\/new-and-improved-embedding-model\">text-embedding-ada-002-instruct<\/a>","Model Size (Million Parameters)":"","Memory Usage (GB, fp32)":"","Average":19.56,"ARCChallenge":11.85,"AlphaNLI":10.62,"HellaSwag":24.8,"PIQA":23.87,"Quail":5.79,"RARbCode":82.36,"RARbMath":67.26,"SIQA":2.64,"SpartQA":4.75,"TempReasonL1":1.44,"TempReasonL2Fact":19.38,"TempReasonL2Pure":2.43,"TempReasonL3Fact":17.58,"TempReasonL3Pure":7.31,"WinoGrande":11.36}
16
+ {"index":1,"Rank":16,"Model":"<a target=\"_blank\" style=\"text-decoration: underline\" href=\"https:\/\/github.com\/facebookresearch\/dpr-scale\/tree\/main\/dragon\">dragon-plus<\/a>","Model Size (Million Parameters)":438,"Memory Usage (GB, fp32)":1.63,"Average":19.1,"ARCChallenge":8.91,"AlphaNLI":32.1,"HellaSwag":27.69,"PIQA":28.01,"Quail":4.09,"RARbCode":17.58,"RARbMath":45.09,"SIQA":2.0,"SpartQA":10.34,"TempReasonL1":1.82,"TempReasonL2Fact":17.45,"TempReasonL2Pure":0.55,"TempReasonL3Fact":15.71,"TempReasonL3Pure":7.97,"WinoGrande":67.18}
17
+ {"index":22,"Rank":17,"Model":"<a target=\"_blank\" style=\"text-decoration: underline\" href=\"https:\/\/huggingface.co\/sentence-transformers\/all-mpnet-base-v2\">all-mpnet-base-v2<\/a>","Model Size (Million Parameters)":110,"Memory Usage (GB, fp32)":0.41,"Average":18.03,"ARCChallenge":11.8,"AlphaNLI":22.41,"HellaSwag":26.27,"PIQA":29.03,"Quail":3.41,"RARbCode":53.21,"RARbMath":71.85,"SIQA":2.38,"SpartQA":0.22,"TempReasonL1":1.77,"TempReasonL2Fact":11.2,"TempReasonL2Pure":1.15,"TempReasonL3Fact":9.42,"TempReasonL3Pure":5.59,"WinoGrande":20.8}
18
+ {"index":5,"Rank":18,"Model":"<a target=\"_blank\" style=\"text-decoration: underline\" href=\"https:\/\/huggingface.co\/BAAI\/bge-large-en-v1.5\">bge-large-en-v1.5<\/a>","Model Size (Million Parameters)":1340,"Memory Usage (GB, fp32)":4.99,"Average":17.7,"ARCChallenge":9.99,"AlphaNLI":13.13,"HellaSwag":28.5,"PIQA":27.99,"Quail":1.83,"RARbCode":48.12,"RARbMath":57.36,"SIQA":1.04,"SpartQA":2.99,"TempReasonL1":1.46,"TempReasonL2Fact":24.25,"TempReasonL2Pure":2.35,"TempReasonL3Fact":20.64,"TempReasonL3Pure":6.67,"WinoGrande":19.18}
19
+ {"index":18,"Rank":19,"Model":"<a target=\"_blank\" style=\"text-decoration: underline\" href=\"https:\/\/huggingface.co\/sentence-transformers\/all-MiniLM-L12-v2\">all-MiniLM-L12-v2<\/a>","Model Size (Million Parameters)":33,"Memory Usage (GB, fp32)":0.12,"Average":17.35,"ARCChallenge":10.23,"AlphaNLI":25.35,"HellaSwag":24.08,"PIQA":26.44,"Quail":3.08,"RARbCode":42.44,"RARbMath":66.36,"SIQA":2.09,"SpartQA":2.67,"TempReasonL1":1.66,"TempReasonL2Fact":10.31,"TempReasonL2Pure":0.63,"TempReasonL3Fact":11.11,"TempReasonL3Pure":6.63,"WinoGrande":27.2}
20
+ {"index":0,"Rank":20,"Model":"<a target=\"_blank\" style=\"text-decoration: underline\" href=\"https:\/\/github.com\/facebookresearch\/dpr-scale\/tree\/main\/dragon\">dragon-plus-instruct<\/a>","Model Size (Million Parameters)":438,"Memory Usage (GB, fp32)":1.63,"Average":16.73,"ARCChallenge":8.24,"AlphaNLI":25.18,"HellaSwag":24.06,"PIQA":26.35,"Quail":4.2,"RARbCode":12.84,"RARbMath":36.15,"SIQA":1.75,"SpartQA":10.82,"TempReasonL1":1.54,"TempReasonL2Fact":16.11,"TempReasonL2Pure":0.57,"TempReasonL3Fact":14.81,"TempReasonL3Pure":7.46,"WinoGrande":60.84}
21
+ {"index":19,"Rank":21,"Model":"<a target=\"_blank\" style=\"text-decoration: underline\" href=\"https:\/\/huggingface.co\/sentence-transformers\/all-MiniLM-L6-v2\">all-MiniLM-L6-v2-instruct<\/a>","Model Size (Million Parameters)":23,"Memory Usage (GB, fp32)":0.09,"Average":15.95,"ARCChallenge":9.4,"AlphaNLI":15.09,"HellaSwag":20.51,"PIQA":24.68,"Quail":3.46,"RARbCode":42.47,"RARbMath":62.39,"SIQA":1.53,"SpartQA":0.57,"TempReasonL1":1.05,"TempReasonL2Fact":16.57,"TempReasonL2Pure":0.49,"TempReasonL3Fact":14.01,"TempReasonL3Pure":6.27,"WinoGrande":20.73}
22
+ {"index":15,"Rank":22,"Model":"<a target=\"_blank\" style=\"text-decoration: underline\" href=\"https:\/\/huggingface.co\/facebook\/contriever\">contriever<\/a>","Model Size (Million Parameters)":438,"Memory Usage (GB, fp32)":1.63,"Average":15.86,"ARCChallenge":8.62,"AlphaNLI":31.77,"HellaSwag":14.42,"PIQA":24.64,"Quail":4.97,"RARbCode":9.28,"RARbMath":30.76,"SIQA":1.27,"SpartQA":10.94,"TempReasonL1":1.93,"TempReasonL2Fact":22.68,"TempReasonL2Pure":1.12,"TempReasonL3Fact":20.62,"TempReasonL3Pure":7.8,"WinoGrande":47.15}
23
+ {"index":3,"Rank":23,"Model":"<a target=\"_blank\" style=\"text-decoration: underline\" href=\"https:\/\/huggingface.co\/BAAI\/bge-base-en-v1.5\">bge-base-en-v1.5<\/a>","Model Size (Million Parameters)":438,"Memory Usage (GB, fp32)":1.63,"Average":14.93,"ARCChallenge":9.66,"AlphaNLI":10.99,"HellaSwag":26.64,"PIQA":25.69,"Quail":1.42,"RARbCode":46.47,"RARbMath":46.86,"SIQA":0.94,"SpartQA":3.37,"TempReasonL1":1.07,"TempReasonL2Fact":17.23,"TempReasonL2Pure":1.29,"TempReasonL3Fact":13.36,"TempReasonL3Pure":5.2,"WinoGrande":13.76}
24
+ {"index":4,"Rank":24,"Model":"<a target=\"_blank\" style=\"text-decoration: underline\" href=\"https:\/\/huggingface.co\/BAAI\/bge-large-en-v1.5\">bge-large-en-v1.5-instruct<\/a>","Model Size (Million Parameters)":1340,"Memory Usage (GB, fp32)":4.99,"Average":14.55,"ARCChallenge":8.86,"AlphaNLI":0.86,"HellaSwag":26.24,"PIQA":23.26,"Quail":2.72,"RARbCode":45.25,"RARbMath":49.82,"SIQA":0.59,"SpartQA":2.34,"TempReasonL1":1.17,"TempReasonL2Fact":21.19,"TempReasonL2Pure":2.1,"TempReasonL3Fact":17.59,"TempReasonL3Pure":5.99,"WinoGrande":10.31}
25
+ {"index":9,"Rank":25,"Model":"<a target=\"_blank\" style=\"text-decoration: underline\" href=\"https:\/\/huggingface.co\/BAAI\/bge-small-en-v1.5\">bge-small-en-v1.5<\/a>","Model Size (Million Parameters)":24,"Memory Usage (GB, fp32)":0.09,"Average":14.15,"ARCChallenge":8.95,"AlphaNLI":11.64,"HellaSwag":25.44,"PIQA":23.92,"Quail":1.75,"RARbCode":42.36,"RARbMath":44.98,"SIQA":0.77,"SpartQA":3.55,"TempReasonL1":1.41,"TempReasonL2Fact":17.56,"TempReasonL2Pure":1.05,"TempReasonL3Fact":13.88,"TempReasonL3Pure":4.76,"WinoGrande":10.28}
26
+ {"index":21,"Rank":26,"Model":"<a target=\"_blank\" style=\"text-decoration: underline\" href=\"https:\/\/huggingface.co\/sentence-transformers\/all-mpnet-base-v2\">all-mpnet-base-v2-instruct<\/a>","Model Size (Million Parameters)":110,"Memory Usage (GB, fp32)":0.41,"Average":13.84,"ARCChallenge":10.35,"AlphaNLI":1.96,"HellaSwag":13.01,"PIQA":27.18,"Quail":3.02,"RARbCode":48.95,"RARbMath":69.21,"SIQA":1.29,"SpartQA":1.01,"TempReasonL1":1.52,"TempReasonL2Fact":7.28,"TempReasonL2Pure":1.03,"TempReasonL3Fact":7.03,"TempReasonL3Pure":5.16,"WinoGrande":9.66}
27
+ {"index":2,"Rank":27,"Model":"<a target=\"_blank\" style=\"text-decoration: underline\" href=\"https:\/\/huggingface.co\/BAAI\/bge-base-en-v1.5\">bge-base-en-v1.5-instruct<\/a>","Model Size (Million Parameters)":438,"Memory Usage (GB, fp32)":1.63,"Average":13.52,"ARCChallenge":8.85,"AlphaNLI":4.13,"HellaSwag":24.03,"PIQA":23.03,"Quail":1.25,"RARbCode":46.32,"RARbMath":45.62,"SIQA":0.24,"SpartQA":2.67,"TempReasonL1":0.8,"TempReasonL2Fact":16.56,"TempReasonL2Pure":1.33,"TempReasonL3Fact":12.68,"TempReasonL3Pure":5.08,"WinoGrande":10.27}
28
+ {"index":8,"Rank":28,"Model":"<a target=\"_blank\" style=\"text-decoration: underline\" href=\"https:\/\/huggingface.co\/BAAI\/bge-small-en-v1.5\">bge-small-en-v1.5-instruct<\/a>","Model Size (Million Parameters)":24,"Memory Usage (GB, fp32)":0.09,"Average":12.6,"ARCChallenge":7.72,"AlphaNLI":1.26,"HellaSwag":23.41,"PIQA":20.79,"Quail":2.01,"RARbCode":41.52,"RARbMath":46.5,"SIQA":0.98,"SpartQA":2.86,"TempReasonL1":1.27,"TempReasonL2Fact":16.72,"TempReasonL2Pure":1.1,"TempReasonL3Fact":12.81,"TempReasonL3Pure":4.63,"WinoGrande":5.35}
29
+ {"index":14,"Rank":29,"Model":"<a target=\"_blank\" style=\"text-decoration: underline\" href=\"https:\/\/huggingface.co\/facebook\/contriever\">contriever-instruct<\/a>","Model Size (Million Parameters)":438,"Memory Usage (GB, fp32)":1.63,"Average":"","ARCChallenge":7.63,"AlphaNLI":27.09,"HellaSwag":"","PIQA":21.73,"Quail":4.92,"RARbCode":7.12,"RARbMath":21.83,"SIQA":0.88,"SpartQA":10.56,"TempReasonL1":1.8,"TempReasonL2Fact":22.03,"TempReasonL2Pure":0.94,"TempReasonL3Fact":20.82,"TempReasonL3Pure":7.15,"WinoGrande":26.3}
config.yaml CHANGED
@@ -403,6 +403,32 @@ boards:
403
  credits: null
404
  tasks:
405
  STS: ["STS17 (ar-ar)", "STS17 (en-ar)", "STS17 (en-de)", "STS17 (en-tr)", "STS17 (es-en)", "STS17 (es-es)", "STS17 (fr-en)", "STS17 (it-en)", "STS17 (ko-ko)", "STS17 (nl-en)", "STS22 (ar)", "STS22 (de)", "STS22 (de-en)", "STS22 (de-fr)", "STS22 (de-pl)", "STS22 (es)", "STS22 (es-en)", "STS22 (es-it)", "STS22 (fr)", "STS22 (fr-pl)", "STS22 (it)", "STS22 (pl)", "STS22 (pl-en)", "STS22 (ru)", "STS22 (tr)", "STS22 (zh-en)", "STSBenchmark"]
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
406
  bright:
407
  title: BRIGHT
408
  language_long: "English"
 
403
  credits: null
404
  tasks:
405
  STS: ["STS17 (ar-ar)", "STS17 (en-ar)", "STS17 (en-de)", "STS17 (en-tr)", "STS17 (es-en)", "STS17 (es-es)", "STS17 (fr-en)", "STS17 (it-en)", "STS17 (ko-ko)", "STS17 (nl-en)", "STS22 (ar)", "STS22 (de)", "STS22 (de-en)", "STS22 (de-fr)", "STS22 (de-pl)", "STS22 (es)", "STS22 (es-en)", "STS22 (es-it)", "STS22 (fr)", "STS22 (fr-pl)", "STS22 (it)", "STS22 (pl)", "STS22 (pl-en)", "STS22 (ru)", "STS22 (tr)", "STS22 (zh-en)", "STSBenchmark"]
406
+ rar-b:
407
+ title: RAR-b
408
+ language_long: "English"
409
+ has_overall: false
410
+ acronym: null
411
+ icon: "📚"
412
+ special_icons: null
413
+ credits: "[RAR-b (Xiao et al.)](https://arxiv.org/abs/2404.06347/)"
414
+ metric: nDCG@10
415
+ tasks:
416
+ Retrieval:
417
+ - ARCChallenge
418
+ - AlphaNLI
419
+ - HellaSwag
420
+ - PIQA
421
+ - Quail
422
+ - RARbCode
423
+ - RARbMath
424
+ - SIQA
425
+ - SpartQA
426
+ - TempReasonL1
427
+ - TempReasonL2Fact
428
+ - TempReasonL2Pure
429
+ - TempReasonL3Fact
430
+ - TempReasonL3Pure
431
+ - WinoGrande
432
  bright:
433
  title: BRIGHT
434
  language_long: "English"
model_meta.yaml CHANGED
@@ -7,6 +7,7 @@ model_meta:
7
  is_external: true
8
  is_proprietary: true
9
  is_sentence_transformers_compatible: false
 
10
  Cohere-embed-english-v3.0:
11
  link: https://huggingface.co/Cohere/Cohere-embed-english-v3.0
12
  seq_len: 512
@@ -15,6 +16,16 @@ model_meta:
15
  is_external: true
16
  is_proprietary: true
17
  is_sentence_transformers_compatible: false
 
 
 
 
 
 
 
 
 
 
18
  Cohere-embed-multilingual-light-v3.0:
19
  link: https://huggingface.co/Cohere/Cohere-embed-multilingual-light-v3.0
20
  seq_len: 512
@@ -23,6 +34,7 @@ model_meta:
23
  is_external: true
24
  is_proprietary: true
25
  is_sentence_transformers_compatible: false
 
26
  Cohere-embed-multilingual-v3.0:
27
  link: https://huggingface.co/Cohere/Cohere-embed-multilingual-v3.0
28
  seq_len: 512
@@ -31,6 +43,7 @@ model_meta:
31
  is_external: true
32
  is_proprietary: true
33
  is_sentence_transformers_compatible: false
 
34
  DanskBERT:
35
  link: https://huggingface.co/vesteinn/DanskBERT
36
  seq_len: 514
@@ -39,6 +52,7 @@ model_meta:
39
  is_external: true
40
  is_proprietary: false
41
  is_sentence_transformers_compatible: true
 
42
  FollowIR-7B:
43
  link: https://huggingface.co/jhu-clsp/FollowIR-7B
44
  seq_len: 4096
@@ -46,6 +60,7 @@ model_meta:
46
  is_external: true
47
  is_propietary: false
48
  is_sentence_transformer_compatible: false
 
49
  GritLM-7B:
50
  link: https://huggingface.co/GritLM/GritLM-7B
51
  seq_len: 4096
@@ -53,6 +68,15 @@ model_meta:
53
  is_external: true
54
  is_propietary: false
55
  is_sentence_transformer_compatible: false
 
 
 
 
 
 
 
 
 
56
  LASER2:
57
  link: https://github.com/facebookresearch/LASER
58
  seq_len: N/A
@@ -61,6 +85,7 @@ model_meta:
61
  is_external: true
62
  is_proprietary: false
63
  is_sentence_transformers_compatible: false
 
64
  LLM2Vec-Llama-2-supervised:
65
  link: https://huggingface.co/McGill-NLP/LLM2Vec-Llama-2-7b-chat-hf-mntp-supervised
66
  seq_len: 4096
@@ -69,6 +94,7 @@ model_meta:
69
  is_external: true
70
  is_proprietary: false
71
  is_sentence_transformers_compatible: false
 
72
  LLM2Vec-Llama-2-unsupervised:
73
  link: https://huggingface.co/McGill-NLP/LLM2Vec-Llama-2-7b-chat-hf-mntp-unsup-simcse
74
  seq_len: 4096
@@ -77,6 +103,7 @@ model_meta:
77
  is_external: true
78
  is_proprietary: false
79
  is_sentence_transformers_compatible: false
 
80
  LLM2Vec-Meta-Llama-3-supervised:
81
  link: https://huggingface.co/McGill-NLP/LLM2Vec-Meta-Llama-3-8B-Instruct-mntp-supervised
82
  seq_len: 8192
@@ -85,6 +112,7 @@ model_meta:
85
  is_external: true
86
  is_proprietary: false
87
  is_sentence_transformers_compatible: false
 
88
  LLM2Vec-Meta-Llama-3-unsupervised:
89
  link: https://huggingface.co/McGill-NLP/LLM2Vec-Meta-Llama-3-8B-Instruct-mntp-unsup-simcse
90
  seq_len: 8192
@@ -93,6 +121,7 @@ model_meta:
93
  is_external: true
94
  is_proprietary: false
95
  is_sentence_transformers_compatible: false
 
96
  LLM2Vec-Mistral-supervised:
97
  link: https://huggingface.co/McGill-NLP/LLM2Vec-Mistral-7B-Instruct-v2-mntp-supervised
98
  seq_len: 32768
@@ -101,6 +130,7 @@ model_meta:
101
  is_external: true
102
  is_proprietary: false
103
  is_sentence_transformers_compatible: false
 
104
  LLM2Vec-Mistral-unsupervised:
105
  link: https://huggingface.co/McGill-NLP/LLM2Vec-Mistral-7B-Instruct-v2-mntp-unsup-simcse
106
  seq_len: 32768
@@ -109,6 +139,7 @@ model_meta:
109
  is_external: true
110
  is_proprietary: false
111
  is_sentence_transformers_compatible: false
 
112
  LLM2Vec-Sheared-Llama-supervised:
113
  link: https://huggingface.co/McGill-NLP/LLM2Vec-Sheared-LLaMA-mntp-supervised
114
  seq_len: 4096
@@ -117,6 +148,7 @@ model_meta:
117
  is_external: true
118
  is_proprietary: false
119
  is_sentence_transformers_compatible: false
 
120
  LLM2Vec-Sheared-Llama-unsupervised:
121
  link: https://huggingface.co/McGill-NLP/LLM2Vec-Sheared-LLaMA-mntp-unsup-simcse
122
  seq_len: 4096
@@ -125,6 +157,7 @@ model_meta:
125
  is_external: true
126
  is_proprietary: false
127
  is_sentence_transformers_compatible: false
 
128
  LaBSE:
129
  link: https://huggingface.co/sentence-transformers/LaBSE
130
  seq_len: 512
@@ -133,6 +166,34 @@ model_meta:
133
  is_external: true
134
  is_proprietary: false
135
  is_sentence_transformers_compatible: true
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
136
  OpenSearch-text-hybrid:
137
  link: https://help.aliyun.com/zh/open-search/vector-search-edition/hybrid-retrieval
138
  seq_len: 512
@@ -141,6 +202,7 @@ model_meta:
141
  is_external: true
142
  is_proprietary: true
143
  is_sentence_transformers_compatible: false
 
144
  SFR-Embedding-Mistral:
145
  link: https://huggingface.co/Salesforce/SFR-Embedding-Mistral
146
  seq_len: 32768
@@ -149,6 +211,7 @@ model_meta:
149
  is_external: true
150
  is_proprietary: false
151
  is_sentence_transformers_compatible: true
 
152
  all-MiniLM-L12-v2:
153
  link: https://huggingface.co/sentence-transformers/all-MiniLM-L12-v2
154
  seq_len: 512
@@ -157,6 +220,7 @@ model_meta:
157
  is_external: true
158
  is_proprietary: false
159
  is_sentence_transformers_compatible: true
 
160
  all-MiniLM-L6-v2:
161
  link: https://huggingface.co/sentence-transformers/all-MiniLM-L6-v2
162
  seq_len: 512
@@ -165,6 +229,16 @@ model_meta:
165
  is_external: true
166
  is_proprietary: false
167
  is_sentence_transformers_compatible: true
 
 
 
 
 
 
 
 
 
 
168
  all-mpnet-base-v2:
169
  link: https://huggingface.co/sentence-transformers/all-mpnet-base-v2
170
  seq_len: 514
@@ -173,6 +247,16 @@ model_meta:
173
  is_external: true
174
  is_proprietary: false
175
  is_sentence_transformers_compatible: true
 
 
 
 
 
 
 
 
 
 
176
  allenai-specter:
177
  link: https://huggingface.co/sentence-transformers/allenai-specter
178
  seq_len: 512
@@ -181,6 +265,7 @@ model_meta:
181
  is_external: true
182
  is_proprietary: false
183
  is_sentence_transformers_compatible: true
 
184
  bert-base-10lang-cased:
185
  link: https://huggingface.co/Geotrend/bert-base-10lang-cased
186
  seq_len: 512
@@ -189,6 +274,7 @@ model_meta:
189
  is_external: true
190
  is_proprietary: false
191
  is_sentence_transformers_compatible: true
 
192
  bert-base-15lang-cased:
193
  link: https://huggingface.co/Geotrend/bert-base-15lang-cased
194
  seq_len: 512
@@ -197,6 +283,7 @@ model_meta:
197
  is_external: true
198
  is_proprietary: false
199
  is_sentence_transformers_compatible: true
 
200
  bert-base-25lang-cased:
201
  link: https://huggingface.co/Geotrend/bert-base-25lang-cased
202
  seq_len: 512
@@ -205,6 +292,7 @@ model_meta:
205
  is_external: true
206
  is_proprietary: false
207
  is_sentence_transformers_compatible: true
 
208
  bert-base-multilingual-cased:
209
  link: https://huggingface.co/google-bert/bert-base-multilingual-cased
210
  seq_len: 512
@@ -213,6 +301,7 @@ model_meta:
213
  is_external: true
214
  is_proprietary: false
215
  is_sentence_transformers_compatible: true
 
216
  bert-base-multilingual-uncased:
217
  link: https://huggingface.co/google-bert/bert-base-multilingual-uncased
218
  seq_len: 512
@@ -221,6 +310,7 @@ model_meta:
221
  is_external: true
222
  is_proprietary: false
223
  is_sentence_transformers_compatible: true
 
224
  bert-base-swedish-cased:
225
  link: https://huggingface.co/KB/bert-base-swedish-cased
226
  seq_len: 512
@@ -229,6 +319,7 @@ model_meta:
229
  is_external: true
230
  is_proprietary: false
231
  is_sentence_transformers_compatible: true
 
232
  bert-base-uncased:
233
  link: https://huggingface.co/bert-base-uncased
234
  seq_len: 512
@@ -237,6 +328,25 @@ model_meta:
237
  is_external: true
238
  is_proprietary: false
239
  is_sentence_transformers_compatible: true
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
240
  bge-base-zh-v1.5:
241
  link: https://huggingface.co/BAAI/bge-base-zh-v1.5
242
  seq_len: 512
@@ -245,14 +355,25 @@ model_meta:
245
  is_external: true
246
  is_proprietary: false
247
  is_sentence_transformers_compatible: true
 
248
  bge-large-en-v1.5:
249
  link: https://huggingface.co/BAAI/bge-large-en-v1.5
250
  seq_len: 512
251
- size: null
 
 
 
 
 
 
 
 
 
252
  dim: 1024
253
  is_external: true
254
  is_proprietary: false
255
  is_sentence_transformers_compatible: false
 
256
  bge-large-zh-noinstruct:
257
  link: https://huggingface.co/BAAI/bge-large-zh-noinstruct
258
  seq_len: 512
@@ -261,6 +382,7 @@ model_meta:
261
  is_external: true
262
  is_proprietary: false
263
  is_sentence_transformers_compatible: true
 
264
  bge-large-zh-v1.5:
265
  link: https://huggingface.co/BAAI/bge-large-zh-v1.5
266
  seq_len: 512
@@ -269,6 +391,7 @@ model_meta:
269
  is_external: true
270
  is_proprietary: false
271
  is_sentence_transformers_compatible: true
 
272
  bge-m3:
273
  link: https://huggingface.co/BAAI/bge-m3
274
  seq_len: 8192
@@ -277,6 +400,34 @@ model_meta:
277
  is_external: true
278
  is_proprietary: false
279
  is_sentence_transformers_compatible: false
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
280
  bge-small-zh-v1.5:
281
  link: https://huggingface.co/BAAI/bge-small-zh-v1.5
282
  seq_len: 512
@@ -285,12 +436,21 @@ model_meta:
285
  is_external: true
286
  is_proprietary: false
287
  is_sentence_transformers_compatible: true
288
- bm25:
 
289
  link: https://en.wikipedia.org/wiki/Okapi_BM25
290
  size: 0
291
  is_external: true
292
  is_proprietary: false
293
  is_sentence_transformers_compatible: false
 
 
 
 
 
 
 
 
294
  camembert-base:
295
  link: https://huggingface.co/almanach/camembert-base
296
  seq_len: 512
@@ -299,6 +459,7 @@ model_meta:
299
  is_external: false
300
  is_proprietary: false
301
  is_sentence_transformers_compatible: true
 
302
  camembert-large:
303
  link: https://huggingface.co/almanach/camembert-large
304
  seq_len: 512
@@ -307,6 +468,7 @@ model_meta:
307
  is_external: false
308
  is_proprietary: false
309
  is_sentence_transformers_compatible: true
 
310
  contriever-base-msmarco:
311
  link: https://huggingface.co/nthakur/contriever-base-msmarco
312
  seq_len: 512
@@ -315,6 +477,25 @@ model_meta:
315
  is_external: true
316
  is_proprietary: false
317
  is_sentence_transformers_compatible: true
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
318
  cross-en-de-roberta-sentence-transformer:
319
  link: https://huggingface.co/T-Systems-onsite/cross-en-de-roberta-sentence-transformer
320
  seq_len: 514
@@ -323,6 +504,7 @@ model_meta:
323
  is_external: true
324
  is_proprietary: false
325
  is_sentence_transformers_compatible: true
 
326
  dfm-encoder-large-v1:
327
  link: https://huggingface.co/chcaa/dfm-encoder-large-v1
328
  seq_len: 512
@@ -331,6 +513,7 @@ model_meta:
331
  is_external: true
332
  is_proprietary: false
333
  is_sentence_transformers_compatible: true
 
334
  dfm-sentence-encoder-large-1:
335
  link: https://huggingface.co/chcaa/dfm-encoder-large-v1
336
  seq_len: 512
@@ -339,6 +522,7 @@ model_meta:
339
  is_external: true
340
  is_proprietary: false
341
  is_sentence_transformers_compatible: true
 
342
  distilbert-base-25lang-cased:
343
  link: https://huggingface.co/Geotrend/distilbert-base-25lang-cased
344
  seq_len: 512
@@ -347,6 +531,7 @@ model_meta:
347
  is_external: false
348
  is_proprietary: false
349
  is_sentence_transformers_compatible: true
 
350
  distilbert-base-en-fr-cased:
351
  link: https://huggingface.co/Geotrend/distilbert-base-en-fr-cased
352
  seq_len: 512
@@ -355,6 +540,7 @@ model_meta:
355
  is_external: false
356
  is_proprietary: false
357
  is_sentence_transformers_compatible: true
 
358
  distilbert-base-en-fr-es-pt-it-cased:
359
  link: https://huggingface.co/Geotrend/distilbert-base-en-fr-es-pt-it-cased
360
  seq_len: 512
@@ -363,6 +549,7 @@ model_meta:
363
  is_external: false
364
  is_proprietary: false
365
  is_sentence_transformers_compatible: true
 
366
  distilbert-base-fr-cased:
367
  link: https://huggingface.co/Geotrend/distilbert-base-fr-cased
368
  seq_len: 512
@@ -371,6 +558,7 @@ model_meta:
371
  is_external: false
372
  is_proprietary: false
373
  is_sentence_transformers_compatible: true
 
374
  distilbert-base-uncased:
375
  link: https://huggingface.co/distilbert-base-uncased
376
  seq_len: 512
@@ -379,6 +567,7 @@ model_meta:
379
  is_external: false
380
  is_proprietary: false
381
  is_sentence_transformers_compatible: true
 
382
  distiluse-base-multilingual-cased-v2:
383
  link: https://huggingface.co/sentence-transformers/distiluse-base-multilingual-cased-v2
384
  seq_len: 512
@@ -387,6 +576,25 @@ model_meta:
387
  is_external: true
388
  is_proprietary: false
389
  is_sentence_transformers_compatible: true
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
390
  e5-base-4k:
391
  link: https://huggingface.co/dwzhu/e5-base-4k
392
  seq_len: 512
@@ -395,6 +603,7 @@ model_meta:
395
  is_external: true
396
  is_proprietary: false
397
  is_sentence_transformers_compatible: true
 
398
  e5-base-v2:
399
  link: https://huggingface.co/intfloat/e5-base-v2
400
  seq_len: 512
@@ -403,6 +612,7 @@ model_meta:
403
  is_external: true
404
  is_proprietary: false
405
  is_sentence_transformers_compatible: true
 
406
  e5-base:
407
  link: https://huggingface.co/intfloat/e5-base
408
  seq_len: 512
@@ -411,6 +621,7 @@ model_meta:
411
  is_external: true
412
  is_proprietary: false
413
  is_sentence_transformers_compatible: true
 
414
  e5-large-v2:
415
  link: https://huggingface.co/intfloat/e5-large-v2
416
  seq_len: 512
@@ -419,6 +630,7 @@ model_meta:
419
  is_external: true
420
  is_proprietary: false
421
  is_sentence_transformers_compatible: true
 
422
  e5-large:
423
  link: https://huggingface.co/intfloat/e5-large
424
  seq_len: 512
@@ -427,6 +639,7 @@ model_meta:
427
  is_external: true
428
  is_proprietary: false
429
  is_sentence_transformers_compatible: true
 
430
  e5-mistral-7b-instruct:
431
  link: https://huggingface.co/intfloat/e5-mistral-7b-instruct
432
  seq_len: 32768
@@ -435,6 +648,16 @@ model_meta:
435
  is_external: true
436
  is_proprietary: false
437
  is_sentence_transformers_compatible: true
 
 
 
 
 
 
 
 
 
 
438
  e5-small:
439
  link: https://huggingface.co/intfloat/e5-small
440
  seq_len: 512
@@ -443,6 +666,7 @@ model_meta:
443
  is_external: true
444
  is_proprietary: false
445
  is_sentence_transformers_compatible: true
 
446
  electra-small-nordic:
447
  link: https://huggingface.co/jonfd/electra-small-nordic
448
  seq_len: 512
@@ -451,6 +675,7 @@ model_meta:
451
  is_external: true
452
  is_proprietary: false
453
  is_sentence_transformers_compatible: true
 
454
  electra-small-swedish-cased-discriminator:
455
  link: https://huggingface.co/KBLab/electra-small-swedish-cased-discriminator
456
  seq_len: 512
@@ -459,6 +684,7 @@ model_meta:
459
  is_external: true
460
  is_proprietary: false
461
  is_sentence_transformers_compatible: true
 
462
  elser-v2:
463
  link: https://www.elastic.co/guide/en/machine-learning/current/ml-nlp-elser.html
464
  seq_len: 512
@@ -467,6 +693,7 @@ model_meta:
467
  is_external: true
468
  is_proprietary: false
469
  is_sentence_transformers_compatible: false
 
470
  flan-t5-base:
471
  link: https://huggingface.co/google/flan-t5-base
472
  seq_len: 512
@@ -475,6 +702,7 @@ model_meta:
475
  is_external: true
476
  is_proprietary: false
477
  is_sentence_transformers_compatible: true
 
478
  flan-t5-large:
479
  link: https://huggingface.co/google/flan-t5-large
480
  seq_len: 512
@@ -483,6 +711,7 @@ model_meta:
483
  is_external: true
484
  is_proprietary: false
485
  is_sentence_transformers_compatible: true
 
486
  flaubert_base_cased:
487
  link: https://huggingface.co/flaubert/flaubert_base_cased
488
  seq_len: 512
@@ -491,6 +720,7 @@ model_meta:
491
  is_external: true
492
  is_proprietary: false
493
  is_sentence_transformers_compatible: true
 
494
  flaubert_base_uncased:
495
  link: https://huggingface.co/flaubert/flaubert_base_uncased
496
  seq_len: 512
@@ -499,6 +729,7 @@ model_meta:
499
  is_external: true
500
  is_proprietary: false
501
  is_sentence_transformers_compatible: true
 
502
  flaubert_large_cased:
503
  link: https://huggingface.co/flaubert/flaubert_large_cased
504
  seq_len: 512
@@ -507,6 +738,7 @@ model_meta:
507
  is_external: true
508
  is_proprietary: false
509
  is_sentence_transformers_compatible: true
 
510
  gbert-base:
511
  link: https://huggingface.co/deepset/gbert-base
512
  seq_len: 512
@@ -515,6 +747,7 @@ model_meta:
515
  is_external: true
516
  is_proprietary: false
517
  is_sentence_transformers_compatible: true
 
518
  gbert-large:
519
  link: https://huggingface.co/deepset/gbert-large
520
  seq_len: 512
@@ -523,6 +756,7 @@ model_meta:
523
  is_external: true
524
  is_proprietary: false
525
  is_sentence_transformers_compatible: true
 
526
  gelectra-base:
527
  link: https://huggingface.co/deepset/gelectra-base
528
  seq_len: 512
@@ -531,6 +765,7 @@ model_meta:
531
  is_external: true
532
  is_proprietary: false
533
  is_sentence_transformers_compatible: true
 
534
  gelectra-large:
535
  link: https://huggingface.co/deepset/gelectra-large
536
  seq_len: 512
@@ -539,6 +774,7 @@ model_meta:
539
  is_external: true
540
  is_proprietary: false
541
  is_sentence_transformers_compatible: true
 
542
  glove.6B.300d:
543
  link: https://huggingface.co/sentence-transformers/average_word_embeddings_glove.6B.300d
544
  seq_len: N/A
@@ -547,6 +783,7 @@ model_meta:
547
  is_external: true
548
  is_proprietary: false
549
  is_sentence_transformers_compatible: true
 
550
  google-gecko-256.text-embedding-preview-0409:
551
  link: https://cloud.google.com/vertex-ai/generative-ai/docs/embeddings/get-text-embeddings#latest_models
552
  seq_len: 2048
@@ -555,6 +792,7 @@ model_meta:
555
  is_external: true
556
  is_proprietary: true
557
  is_sentence_transformers_compatible: false
 
558
  google-gecko.text-embedding-preview-0409:
559
  link: https://cloud.google.com/vertex-ai/generative-ai/docs/embeddings/get-text-embeddings#latest_models
560
  seq_len: 2048
@@ -563,6 +801,7 @@ model_meta:
563
  is_external: true
564
  is_proprietary: true
565
  is_sentence_transformers_compatible: false
 
566
  gottbert-base:
567
  link: https://huggingface.co/uklfr/gottbert-base
568
  seq_len: 512
@@ -571,6 +810,7 @@ model_meta:
571
  is_external: true
572
  is_proprietary: false
573
  is_sentence_transformers_compatible: true
 
574
  gte-Qwen1.5-7B-instruct:
575
  link: https://huggingface.co/Alibaba-NLP/gte-Qwen1.5-7B-instruct
576
  seq_len: 32768
@@ -579,6 +819,7 @@ model_meta:
579
  is_external: true
580
  is_proprietary: false
581
  is_sentence_transformers_compatible: true
 
582
  gte-Qwen2-7B-instruct:
583
  link: https://huggingface.co/Alibaba-NLP/gte-Qwen2-7B-instruct
584
  seq_len: 32768
@@ -587,6 +828,7 @@ model_meta:
587
  is_external: true
588
  is_proprietary: false
589
  is_sentence_transformers_compatible: true
 
590
  gtr-t5-base:
591
  link: https://huggingface.co/sentence-transformers/gtr-t5-base
592
  seq_len: 512
@@ -595,6 +837,7 @@ model_meta:
595
  is_external: true
596
  is_proprietary: false
597
  is_sentence_transformers_compatible: true
 
598
  gtr-t5-large:
599
  link: https://huggingface.co/sentence-transformers/gtr-t5-large
600
  seq_len: 512
@@ -603,6 +846,7 @@ model_meta:
603
  is_external: true
604
  is_proprietary: false
605
  is_sentence_transformers_compatible: true
 
606
  gtr-t5-xl:
607
  link: https://huggingface.co/sentence-transformers/gtr-t5-xl
608
  seq_len: 512
@@ -611,6 +855,7 @@ model_meta:
611
  is_external: true
612
  is_proprietary: false
613
  is_sentence_transformers_compatible: true
 
614
  gtr-t5-xxl:
615
  link: https://huggingface.co/sentence-transformers/gtr-t5-xxl
616
  seq_len: 512
@@ -619,6 +864,7 @@ model_meta:
619
  is_external: true
620
  is_proprietary: false
621
  is_sentence_transformers_compatible: true
 
622
  herbert-base-retrieval-v2:
623
  link: https://huggingface.co/ipipan/herbert-base-retrieval-v2
624
  seq_len: 514
@@ -627,6 +873,7 @@ model_meta:
627
  is_external: true
628
  is_proprietary: false
629
  is_sentence_transformers_compatible: true
 
630
  instructor-base:
631
  link: https://huggingface.co/hkunlp/instructor-base
632
  seq_len: N/A
@@ -635,6 +882,7 @@ model_meta:
635
  is_external: true
636
  is_proprietary: false
637
  is_sentence_transformers_compatible: true
 
638
  instructor-large:
639
  link: https://huggingface.co/hkunlp/instructor-large
640
  seq_len: 512
@@ -643,6 +891,7 @@ model_meta:
643
  is_external: true
644
  is_proprietary: false
645
  is_sentence_transformers_compatible: true
 
646
  instructor-xl:
647
  link: https://huggingface.co/hkunlp/instructor-xl
648
  seq_len: 512
@@ -651,6 +900,7 @@ model_meta:
651
  is_external: true
652
  is_proprietary: false
653
  is_sentence_transformers_compatible: true
 
654
  jina-embeddings-v2-base-en:
655
  link: https://huggingface.co/jinaai/jina-embeddings-v2-base-en
656
  seq_len: 8192
@@ -659,6 +909,7 @@ model_meta:
659
  is_external: true
660
  is_proprietary: false
661
  is_sentence_transformers_compatible: true
 
662
  komninos:
663
  link: https://huggingface.co/sentence-transformers/average_word_embeddings_komninos
664
  seq_len: N/A
@@ -667,6 +918,7 @@ model_meta:
667
  is_external: true
668
  is_proprietary: false
669
  is_sentence_transformers_compatible: true
 
670
  llama-2-7b-chat:
671
  link: https://huggingface.co/meta-llama/Llama-2-7b-chat-hf
672
  seq_len: 4096
@@ -675,6 +927,7 @@ model_meta:
675
  is_external: true
676
  is_proprietary: false
677
  is_sentence_transformers_compatible: false
 
678
  luotuo-bert-medium:
679
  link: https://huggingface.co/silk-road/luotuo-bert-medium
680
  seq_len: 512
@@ -683,6 +936,7 @@ model_meta:
683
  is_external: true
684
  is_proprietary: false
685
  is_sentence_transformers_compatible: true
 
686
  m3e-base:
687
  link: https://huggingface.co/moka-ai/m3e-base
688
  seq_len: 512
@@ -691,6 +945,7 @@ model_meta:
691
  is_external: true
692
  is_proprietary: false
693
  is_sentence_transformers_compatible: true
 
694
  m3e-large:
695
  link: https://huggingface.co/moka-ai/m3e-large
696
  seq_len: 512
@@ -699,6 +954,7 @@ model_meta:
699
  is_external: true
700
  is_proprietary: false
701
  is_sentence_transformers_compatible: true
 
702
  mistral-7b-instruct-v0.2:
703
  link: https://huggingface.co/mistralai/Mistral-7B-Instruct-v0.2
704
  seq_len: 4096
@@ -707,6 +963,7 @@ model_meta:
707
  is_external: true
708
  is_proprietary: false
709
  is_sentence_transformers_compatible: false
 
710
  mistral-embed:
711
  link: https://docs.mistral.ai/guides/embeddings
712
  seq_len: null
@@ -715,6 +972,7 @@ model_meta:
715
  is_external: true
716
  is_proprietary: true
717
  is_sentence_transformers_compatible: false
 
718
  monobert-large-msmarco:
719
  link: https://huggingface.co/castorini/monobert-large-msmarco
720
  seq_len: 512
@@ -723,6 +981,7 @@ model_meta:
723
  is_external: true
724
  is_proprietary: false
725
  is_sentence_transformers_compatible: false
 
726
  monot5-3b-msmarco-10k:
727
  link: https://huggingface.co/castorini/monot5-3b-msmarco-10k
728
  seq_len: 512
@@ -731,6 +990,7 @@ model_meta:
731
  is_external: true
732
  is_proprietary: false
733
  is_sentence_transformers_compatible: false
 
734
  monot5-base-msmarco-10k:
735
  link: https://huggingface.co/castorini/monot5-base-msmarco-10k
736
  seq_len: 512
@@ -739,6 +999,7 @@ model_meta:
739
  is_external: true
740
  is_proprietary: false
741
  is_sentence_transformers_compatible: false
 
742
  msmarco-bert-co-condensor:
743
  link: https://huggingface.co/sentence-transformers/msmarco-bert-co-condensor
744
  seq_len: 512
@@ -747,6 +1008,7 @@ model_meta:
747
  is_external: true
748
  is_proprietary: false
749
  is_sentence_transformers_compatible: true
 
750
  multi-qa-MiniLM-L6-cos-v1:
751
  link: https://huggingface.co/sentence-transformers/multi-qa-MiniLM-L6-cos-v1
752
  seq_len: 512
@@ -755,6 +1017,7 @@ model_meta:
755
  is_external: true
756
  is_proprietary: false
757
  is_sentence_transformers_compatible: true
 
758
  multilingual-e5-base:
759
  link: https://huggingface.co/intfloat/multilingual-e5-base
760
  seq_len: 514
@@ -763,6 +1026,7 @@ model_meta:
763
  is_external: true
764
  is_proprietary: false
765
  is_sentence_transformers_compatible: true
 
766
  multilingual-e5-large:
767
  link: https://huggingface.co/intfloat/multilingual-e5-large
768
  seq_len: 514
@@ -771,6 +1035,7 @@ model_meta:
771
  is_external: true
772
  is_proprietary: false
773
  is_sentence_transformers_compatible: true
 
774
  multilingual-e5-small:
775
  link: https://huggingface.co/intfloat/multilingual-e5-small
776
  seq_len: 512
@@ -779,6 +1044,7 @@ model_meta:
779
  is_external: true
780
  is_proprietary: false
781
  is_sentence_transformers_compatible: true
 
782
  nb-bert-base:
783
  link: https://huggingface.co/NbAiLab/nb-bert-base
784
  seq_len: 512
@@ -787,6 +1053,7 @@ model_meta:
787
  is_external: true
788
  is_proprietary: false
789
  is_sentence_transformers_compatible: true
 
790
  nb-bert-large:
791
  link: https://huggingface.co/NbAiLab/nb-bert-large
792
  seq_len: 512
@@ -795,6 +1062,7 @@ model_meta:
795
  is_external: true
796
  is_proprietary: false
797
  is_sentence_transformers_compatible: true
 
798
  nomic-embed-text-v1:
799
  link: https://huggingface.co/nomic-ai/nomic-embed-text-v1
800
  seq_len: 8192
@@ -803,6 +1071,7 @@ model_meta:
803
  is_external: true
804
  is_proprietary: false
805
  is_sentence_transformers_compatible: true
 
806
  nomic-embed-text-v1.5-128:
807
  link: https://huggingface.co/nomic-ai/nomic-embed-text-v1.5
808
  seq_len: 8192
@@ -811,6 +1080,7 @@ model_meta:
811
  is_external: true
812
  is_proprietary: false
813
  is_sentence_transformers_compatible: true
 
814
  nomic-embed-text-v1.5-256:
815
  link: https://huggingface.co/nomic-ai/nomic-embed-text-v1.5
816
  seq_len: 8192
@@ -819,6 +1089,7 @@ model_meta:
819
  is_external: true
820
  is_proprietary: false
821
  is_sentence_transformers_compatible: true
 
822
  nomic-embed-text-v1.5-512:
823
  link: https://huggingface.co/nomic-ai/nomic-embed-text-v1.5
824
  seq_len: 8192
@@ -827,6 +1098,7 @@ model_meta:
827
  is_external: true
828
  is_proprietary: false
829
  is_sentence_transformers_compatible: true
 
830
  nomic-embed-text-v1.5-64:
831
  link: https://huggingface.co/nomic-ai/nomic-embed-text-v1.5
832
  seq_len: 8192
@@ -835,6 +1107,7 @@ model_meta:
835
  is_external: true
836
  is_proprietary: false
837
  is_sentence_transformers_compatible: true
 
838
  norbert3-base:
839
  link: https://huggingface.co/ltg/norbert3-base
840
  seq_len: 512
@@ -843,6 +1116,7 @@ model_meta:
843
  is_external: true
844
  is_proprietary: false
845
  is_sentence_transformers_compatible: true
 
846
  norbert3-large:
847
  link: https://huggingface.co/ltg/norbert3-large
848
  seq_len: 512
@@ -851,6 +1125,7 @@ model_meta:
851
  is_external: true
852
  is_proprietary: false
853
  is_sentence_transformers_compatible: true
 
854
  paraphrase-multilingual-MiniLM-L12-v2:
855
  link: https://huggingface.co/sentence-transformers/paraphrase-multilingual-MiniLM-L12-v2
856
  seq_len: 512
@@ -859,6 +1134,7 @@ model_meta:
859
  is_external: true
860
  is_proprietary: false
861
  is_sentence_transformers_compatible: true
 
862
  paraphrase-multilingual-mpnet-base-v2:
863
  link: https://huggingface.co/sentence-transformers/paraphrase-multilingual-mpnet-base-v2
864
  seq_len: 514
@@ -867,6 +1143,7 @@ model_meta:
867
  is_external: true
868
  is_proprietary: false
869
  is_sentence_transformers_compatible: true
 
870
  sentence-bert-swedish-cased:
871
  link: https://huggingface.co/KBLab/sentence-bert-swedish-cased
872
  seq_len: 512
@@ -875,6 +1152,7 @@ model_meta:
875
  is_external: true
876
  is_proprietary: false
877
  is_sentence_transformers_compatible: true
 
878
  sentence-camembert-base:
879
  link: https://huggingface.co/dangvantuan/sentence-camembert-base
880
  seq_len: 512
@@ -883,6 +1161,7 @@ model_meta:
883
  is_external: true
884
  is_proprietary: false
885
  is_sentence_transformers_compatible: true
 
886
  sentence-camembert-large:
887
  link: https://huggingface.co/dangvantuan/sentence-camembert-large
888
  seq_len: 512
@@ -891,6 +1170,7 @@ model_meta:
891
  is_external: true
892
  is_proprietary: false
893
  is_sentence_transformers_compatible: true
 
894
  sentence-croissant-llm-base:
895
  link: https://huggingface.co/Wissam42/sentence-croissant-llm-base
896
  seq_len: 2048
@@ -899,6 +1179,7 @@ model_meta:
899
  is_external: true
900
  is_proprietary: false
901
  is_sentence_transformers_compatible: true
 
902
  sentence-t5-base:
903
  link: https://huggingface.co/sentence-transformers/sentence-t5-base
904
  seq_len: 512
@@ -907,6 +1188,7 @@ model_meta:
907
  is_external: true
908
  is_proprietary: false
909
  is_sentence_transformers_compatible: true
 
910
  sentence-t5-large:
911
  link: https://huggingface.co/sentence-transformers/sentence-t5-large
912
  seq_len: 512
@@ -915,6 +1197,7 @@ model_meta:
915
  is_external: true
916
  is_proprietary: false
917
  is_sentence_transformers_compatible: true
 
918
  sentence-t5-xl:
919
  link: https://huggingface.co/sentence-transformers/sentence-t5-xl
920
  seq_len: 512
@@ -923,6 +1206,7 @@ model_meta:
923
  is_external: true
924
  is_proprietary: false
925
  is_sentence_transformers_compatible: true
 
926
  sentence-t5-xxl:
927
  link: https://huggingface.co/sentence-transformers/sentence-t5-xxl
928
  seq_len: 512
@@ -931,6 +1215,7 @@ model_meta:
931
  is_external: true
932
  is_proprietary: false
933
  is_sentence_transformers_compatible: true
 
934
  silver-retriever-base-v1:
935
  link: https://huggingface.co/ipipan/silver-retriever-base-v1
936
  seq_len: 514
@@ -939,6 +1224,7 @@ model_meta:
939
  is_external: true
940
  is_proprietary: false
941
  is_sentence_transformers_compatible: true
 
942
  st-polish-paraphrase-from-distilroberta:
943
  link: https://huggingface.co/sdadas/st-polish-paraphrase-from-distilroberta
944
  seq_len: 514
@@ -947,6 +1233,7 @@ model_meta:
947
  is_external: true
948
  is_proprietary: false
949
  is_sentence_transformers_compatible: true
 
950
  st-polish-paraphrase-from-mpnet:
951
  link: https://huggingface.co/sdadas/st-polish-paraphrase-from-mpnet
952
  seq_len: 514
@@ -955,6 +1242,7 @@ model_meta:
955
  is_external: true
956
  is_proprietary: false
957
  is_sentence_transformers_compatible: true
 
958
  sup-simcse-bert-base-uncased:
959
  link: https://huggingface.co/princeton-nlp/sup-simcse-bert-base-uncased
960
  seq_len: 512
@@ -963,6 +1251,7 @@ model_meta:
963
  is_external: true
964
  is_proprietary: false
965
  is_sentence_transformers_compatible: true
 
966
  text-embedding-3-large:
967
  link: https://openai.com/blog/new-embedding-models-and-api-updates
968
  seq_len: 8191
@@ -971,6 +1260,16 @@ model_meta:
971
  is_external: true
972
  is_proprietary: true
973
  is_sentence_transformers_compatible: false
 
 
 
 
 
 
 
 
 
 
974
  text-embedding-3-large-256:
975
  link: https://openai.com/blog/new-embedding-models-and-api-updates
976
  seq_len: 8191
@@ -979,6 +1278,7 @@ model_meta:
979
  is_external: true
980
  is_proprietary: true
981
  is_sentence_transformers_compatible: false
 
982
  text-embedding-3-small:
983
  link: https://openai.com/blog/new-embedding-models-and-api-updates
984
  seq_len: 8191
@@ -987,6 +1287,16 @@ model_meta:
987
  is_external: true
988
  is_proprietary: true
989
  is_sentence_transformers_compatible: false
 
 
 
 
 
 
 
 
 
 
990
  text-embedding-ada-002:
991
  link: https://openai.com/blog/new-and-improved-embedding-model
992
  seq_len: 8191
@@ -995,6 +1305,16 @@ model_meta:
995
  is_external: true
996
  is_proprietary: true
997
  is_sentence_transformers_compatible: false
 
 
 
 
 
 
 
 
 
 
998
  text-search-ada-001:
999
  link: https://openai.com/blog/introducing-text-and-code-embeddings
1000
  seq_len: 2046
@@ -1003,6 +1323,7 @@ model_meta:
1003
  is_external: true
1004
  is_proprietary: true
1005
  is_sentence_transformers_compatible: false
 
1006
  text-search-ada-doc-001:
1007
  link: https://openai.com/blog/introducing-text-and-code-embeddings
1008
  seq_len: 2046
@@ -1011,6 +1332,7 @@ model_meta:
1011
  is_external: true
1012
  is_proprietary: true
1013
  is_sentence_transformers_compatible: false
 
1014
  text-search-ada-query-001:
1015
  link: https://openai.com/blog/introducing-text-and-code-embeddings
1016
  seq_len: 2046
@@ -1019,6 +1341,7 @@ model_meta:
1019
  is_external: false
1020
  is_proprietary: true
1021
  is_sentence_transformers_compatible: false
 
1022
  text-search-babbage-001:
1023
  link: https://openai.com/blog/introducing-text-and-code-embeddings
1024
  seq_len: 2046
@@ -1027,6 +1350,7 @@ model_meta:
1027
  is_external: true
1028
  is_proprietary: true
1029
  is_sentence_transformers_compatible: false
 
1030
  text-search-curie-001:
1031
  link: https://openai.com/blog/introducing-text-and-code-embeddings
1032
  seq_len: 2046
@@ -1035,6 +1359,7 @@ model_meta:
1035
  is_external: true
1036
  is_proprietary: true
1037
  is_sentence_transformers_compatible: false
 
1038
  text-search-davinci-001:
1039
  link: https://openai.com/blog/introducing-text-and-code-embeddings
1040
  seq_len: 2046
@@ -1043,6 +1368,7 @@ model_meta:
1043
  is_external: true
1044
  is_proprietary: true
1045
  is_sentence_transformers_compatible: false
 
1046
  text-similarity-ada-001:
1047
  link: https://openai.com/blog/introducing-text-and-code-embeddings
1048
  seq_len: 2046
@@ -1051,6 +1377,7 @@ model_meta:
1051
  is_external: true
1052
  is_proprietary: true
1053
  is_sentence_transformers_compatible: false
 
1054
  text-similarity-babbage-001:
1055
  link: https://openai.com/blog/introducing-text-and-code-embeddings
1056
  seq_len: 2046
@@ -1059,6 +1386,7 @@ model_meta:
1059
  is_external: true
1060
  is_proprietary: true
1061
  is_sentence_transformers_compatible: false
 
1062
  text-similarity-curie-001:
1063
  link: https://openai.com/blog/introducing-text-and-code-embeddings
1064
  seq_len: 2046
@@ -1067,6 +1395,7 @@ model_meta:
1067
  is_external: true
1068
  is_proprietary: true
1069
  is_sentence_transformers_compatible: false
 
1070
  text-similarity-davinci-001:
1071
  link: https://openai.com/blog/introducing-text-and-code-embeddings
1072
  seq_len: 2046
@@ -1075,6 +1404,7 @@ model_meta:
1075
  is_external: true
1076
  is_proprietary: true
1077
  is_sentence_transformers_compatible: false
 
1078
  tart-dual-contriever-msmarco:
1079
  link: https://huggingface.co/orionweller/tart-dual-contriever-msmarco
1080
  seq_len: 512
@@ -1083,6 +1413,7 @@ model_meta:
1083
  is_external: true
1084
  is_proprietary: false
1085
  is_sentence_transformers_compatible: false
 
1086
  tart-full-flan-t5-xl:
1087
  link: https://huggingface.co/facebook/tart-full-flan-t5-xl
1088
  seq_len: 512
@@ -1091,6 +1422,7 @@ model_meta:
1091
  is_external: true
1092
  is_proprietary: false
1093
  is_sentence_transformers_compatible: false
 
1094
  text2vec-base-chinese:
1095
  link: https://huggingface.co/shibing624/text2vec-base-chinese
1096
  seq_len: 512
@@ -1099,6 +1431,7 @@ model_meta:
1099
  is_external: true
1100
  is_proprietary: false
1101
  is_sentence_transformers_compatible: true
 
1102
  text2vec-base-multilingual:
1103
  link: null
1104
  seq_len: null
@@ -1107,6 +1440,7 @@ model_meta:
1107
  is_external: true
1108
  is_proprietary: false
1109
  is_sentence_transformers_compatible: false
 
1110
  text2vec-large-chinese:
1111
  link: https://huggingface.co/GanymedeNil/text2vec-large-chinese
1112
  seq_len: 512
@@ -1115,6 +1449,7 @@ model_meta:
1115
  is_external: true
1116
  is_proprietary: false
1117
  is_sentence_transformers_compatible: true
 
1118
  titan-embed-text-v1:
1119
  link: https://docs.aws.amazon.com/bedrock/latest/userguide/embeddings.html
1120
  seq_len: 8000
@@ -1123,6 +1458,7 @@ model_meta:
1123
  is_external: true
1124
  is_proprietary: true
1125
  is_sentence_transformers_compatible: false
 
1126
  udever-bloom-1b1:
1127
  link: https://huggingface.co/izhx/udever-bloom-1b1
1128
  seq_len: 2048
@@ -1131,6 +1467,7 @@ model_meta:
1131
  is_external: true
1132
  is_proprietary: false
1133
  is_sentence_transformers_compatible: true
 
1134
  udever-bloom-560m:
1135
  link: https://huggingface.co/izhx/udever-bloom-560m
1136
  seq_len: 2048
@@ -1139,6 +1476,7 @@ model_meta:
1139
  is_external: true
1140
  is_proprietary: false
1141
  is_sentence_transformers_compatible: true
 
1142
  universal-sentence-encoder-multilingual-3:
1143
  link: https://huggingface.co/vprelovac/universal-sentence-encoder-multilingual-3
1144
  seq_len: 512
@@ -1147,6 +1485,7 @@ model_meta:
1147
  is_external: true
1148
  is_proprietary: false
1149
  is_sentence_transformers_compatible: true
 
1150
  universal-sentence-encoder-multilingual-large-3:
1151
  link: https://huggingface.co/vprelovac/universal-sentence-encoder-multilingual-large-3
1152
  seq_len: 512
@@ -1155,6 +1494,7 @@ model_meta:
1155
  is_external: true
1156
  is_proprietary: false
1157
  is_sentence_transformers_compatible: true
 
1158
  unsup-simcse-bert-base-uncased:
1159
  link: https://huggingface.co/princeton-nlp/unsup-simcse-bert-base-uncased
1160
  seq_len: 512
@@ -1163,6 +1503,7 @@ model_meta:
1163
  is_external: true
1164
  is_proprietary: false
1165
  is_sentence_transformers_compatible: true
 
1166
  use-cmlm-multilingual:
1167
  link: https://huggingface.co/sentence-transformers/use-cmlm-multilingual
1168
  seq_len: 512
@@ -1171,6 +1512,7 @@ model_meta:
1171
  is_external: true
1172
  is_proprietary: false
1173
  is_sentence_transformers_compatible: true
 
1174
  voyage-2:
1175
  link: https://docs.voyageai.com/embeddings/
1176
  seq_len: 1024
@@ -1179,6 +1521,7 @@ model_meta:
1179
  is_external: true
1180
  is_proprietary: true
1181
  is_sentence_transformers_compatible: false
 
1182
  voyage-code-2:
1183
  link: https://docs.voyageai.com/embeddings/
1184
  seq_len: 16000
@@ -1187,6 +1530,7 @@ model_meta:
1187
  is_external: true
1188
  is_proprietary: true
1189
  is_sentence_transformers_compatible: false
 
1190
  voyage-large-2-instruct:
1191
  link: https://docs.voyageai.com/embeddings/
1192
  seq_len: 16000
@@ -1195,6 +1539,7 @@ model_meta:
1195
  is_external: true
1196
  is_proprietary: false
1197
  is_sentence_transformers_compatible: false
 
1198
  voyage-law-2:
1199
  link: https://docs.voyageai.com/embeddings/
1200
  seq_len: 16000
@@ -1203,6 +1548,7 @@ model_meta:
1203
  is_external: true
1204
  is_proprietary: true
1205
  is_sentence_transformers_compatible: false
 
1206
  voyage-lite-01-instruct:
1207
  link: https://docs.voyageai.com/embeddings/
1208
  seq_len: 4000
@@ -1211,6 +1557,7 @@ model_meta:
1211
  is_external: true
1212
  is_proprietary: true
1213
  is_sentence_transformers_compatible: false
 
1214
  voyage-lite-02-instruct:
1215
  link: https://docs.voyageai.com/embeddings/
1216
  seq_len: 4000
@@ -1219,6 +1566,7 @@ model_meta:
1219
  is_external: true
1220
  is_proprietary: true
1221
  is_sentence_transformers_compatible: false
 
1222
  voyage-multilingual-2:
1223
  link: https://docs.voyageai.com/embeddings/
1224
  seq_len: 32000
@@ -1227,6 +1575,7 @@ model_meta:
1227
  is_external: true
1228
  is_proprietary: true
1229
  is_sentence_transformers_compatible: false
 
1230
  xlm-roberta-base:
1231
  link: https://huggingface.co/xlm-roberta-base
1232
  seq_len: 514
@@ -1235,6 +1584,7 @@ model_meta:
1235
  is_external: true
1236
  is_proprietary: false
1237
  is_sentence_transformers_compatible: true
 
1238
  xlm-roberta-large:
1239
  link: https://huggingface.co/xlm-roberta-large
1240
  seq_len: 514
@@ -1243,30 +1593,7 @@ model_meta:
1243
  is_external: true
1244
  is_proprietary: false
1245
  is_sentence_transformers_compatible: true
1246
- NV-Retriever-v1:
1247
- link: https://huggingface.co/nvidia/NV-Retriever-v1
1248
- seq_len: 512
1249
- size: 7111
1250
- dim: 4096
1251
- is_external: false
1252
- is_proprietary: false
1253
- is_sentence_transformers_compatible: false
1254
- NV-Embed-v1:
1255
- link: https://huggingface.co/nvidia/NV-Embed-v1
1256
- seq_len: 32768
1257
- size: 7851
1258
- dim: 4096
1259
- is_external: false
1260
- is_proprietary: false
1261
- is_sentence_transformers_compatible: false
1262
- Linq-Embed-Mistral:
1263
- link: https://huggingface.co/Linq-AI-Research/Linq-Embed-Mistral
1264
- seq_len: 32768
1265
- size: 7111
1266
- dim: 4096
1267
- is_external: false
1268
- is_proprietary: false
1269
- is_sentence_transformers_compatible: true
1270
  models_to_skip:
1271
  - michaelfeil/ct2fast-e5-large-v2
1272
  - McGill-NLP/LLM2Vec-Sheared-LLaMA-mntp-unsup-simcse
 
7
  is_external: true
8
  is_proprietary: true
9
  is_sentence_transformers_compatible: false
10
+ uses_instruct: false
11
  Cohere-embed-english-v3.0:
12
  link: https://huggingface.co/Cohere/Cohere-embed-english-v3.0
13
  seq_len: 512
 
16
  is_external: true
17
  is_proprietary: true
18
  is_sentence_transformers_compatible: false
19
+ uses_instruct: false
20
+ Cohere-embed-english-v3.0-instruct:
21
+ link: https://huggingface.co/Cohere/Cohere-embed-english-v3.0
22
+ seq_len: 512
23
+ size: null
24
+ dim: 1024
25
+ is_external: true
26
+ is_proprietary: true
27
+ is_sentence_transformers_compatible: false
28
+ uses_instruct: true
29
  Cohere-embed-multilingual-light-v3.0:
30
  link: https://huggingface.co/Cohere/Cohere-embed-multilingual-light-v3.0
31
  seq_len: 512
 
34
  is_external: true
35
  is_proprietary: true
36
  is_sentence_transformers_compatible: false
37
+ uses_instruct: false
38
  Cohere-embed-multilingual-v3.0:
39
  link: https://huggingface.co/Cohere/Cohere-embed-multilingual-v3.0
40
  seq_len: 512
 
43
  is_external: true
44
  is_proprietary: true
45
  is_sentence_transformers_compatible: false
46
+ uses_instruct: false
47
  DanskBERT:
48
  link: https://huggingface.co/vesteinn/DanskBERT
49
  seq_len: 514
 
52
  is_external: true
53
  is_proprietary: false
54
  is_sentence_transformers_compatible: true
55
+ uses_instruct: false
56
  FollowIR-7B:
57
  link: https://huggingface.co/jhu-clsp/FollowIR-7B
58
  seq_len: 4096
 
60
  is_external: true
61
  is_proprietary: false
62
  is_sentence_transformers_compatible: false
63
+ uses_instruct: true
64
  GritLM-7B:
65
  link: https://huggingface.co/GritLM/GritLM-7B
66
  seq_len: 4096
 
68
  is_external: true
69
  is_proprietary: false
70
  is_sentence_transformers_compatible: false
71
+ uses_instruct: true
72
+ GritLM-7B-noinstruct:
73
+ link: https://huggingface.co/GritLM/GritLM-7B
74
+ seq_len: 4096
75
+ size: 7240
76
+ is_external: true
77
+ is_proprietary: false
78
+ is_sentence_transformers_compatible: false
79
+ uses_instruct: false
80
  LASER2:
81
  link: https://github.com/facebookresearch/LASER
82
  seq_len: N/A
 
85
  is_external: true
86
  is_proprietary: false
87
  is_sentence_transformers_compatible: false
88
+ uses_instruct: false
89
  LLM2Vec-Llama-2-supervised:
90
  link: https://huggingface.co/McGill-NLP/LLM2Vec-Llama-2-7b-chat-hf-mntp-supervised
91
  seq_len: 4096
 
94
  is_external: true
95
  is_proprietary: false
96
  is_sentence_transformers_compatible: false
97
+ uses_instruct: true
98
  LLM2Vec-Llama-2-unsupervised:
99
  link: https://huggingface.co/McGill-NLP/LLM2Vec-Llama-2-7b-chat-hf-mntp-unsup-simcse
100
  seq_len: 4096
 
103
  is_external: true
104
  is_proprietary: false
105
  is_sentence_transformers_compatible: false
106
+ uses_instruct: true
107
  LLM2Vec-Meta-Llama-3-supervised:
108
  link: https://huggingface.co/McGill-NLP/LLM2Vec-Meta-Llama-3-8B-Instruct-mntp-supervised
109
  seq_len: 8192
 
112
  is_external: true
113
  is_proprietary: false
114
  is_sentence_transformers_compatible: false
115
+ uses_instruct: true
116
  LLM2Vec-Meta-Llama-3-unsupervised:
117
  link: https://huggingface.co/McGill-NLP/LLM2Vec-Meta-Llama-3-8B-Instruct-mntp-unsup-simcse
118
  seq_len: 8192
 
121
  is_external: true
122
  is_proprietary: false
123
  is_sentence_transformers_compatible: false
124
+ uses_instruct: true
125
  LLM2Vec-Mistral-supervised:
126
  link: https://huggingface.co/McGill-NLP/LLM2Vec-Mistral-7B-Instruct-v2-mntp-supervised
127
  seq_len: 32768
 
130
  is_external: true
131
  is_proprietary: false
132
  is_sentence_transformers_compatible: false
133
+ uses_instruct: true
134
  LLM2Vec-Mistral-unsupervised:
135
  link: https://huggingface.co/McGill-NLP/LLM2Vec-Mistral-7B-Instruct-v2-mntp-unsup-simcse
136
  seq_len: 32768
 
139
  is_external: true
140
  is_proprietary: false
141
  is_sentence_transformers_compatible: false
142
+ uses_instruct: true
143
  LLM2Vec-Sheared-Llama-supervised:
144
  link: https://huggingface.co/McGill-NLP/LLM2Vec-Sheared-LLaMA-mntp-supervised
145
  seq_len: 4096
 
148
  is_external: true
149
  is_proprietary: false
150
  is_sentence_transformers_compatible: false
151
+ uses_instruct: true
152
  LLM2Vec-Sheared-Llama-unsupervised:
153
  link: https://huggingface.co/McGill-NLP/LLM2Vec-Sheared-LLaMA-mntp-unsup-simcse
154
  seq_len: 4096
 
157
  is_external: true
158
  is_proprietary: false
159
  is_sentence_transformers_compatible: false
160
+ uses_instruct: true
161
  LaBSE:
162
  link: https://huggingface.co/sentence-transformers/LaBSE
163
  seq_len: 512
 
166
  is_external: true
167
  is_proprietary: false
168
  is_sentence_transformers_compatible: true
169
+ uses_instruct: false
170
+ Linq-Embed-Mistral:
171
+ link: https://huggingface.co/Linq-AI-Research/Linq-Embed-Mistral
172
+ seq_len: 32768
173
+ size: 7111
174
+ dim: 4096
175
+ is_external: false
176
+ is_proprietary: false
177
+ is_sentence_transformers_compatible: true
178
+ uses_instruct: true
179
+ NV-Embed-v1:
180
+ link: https://huggingface.co/nvidia/NV-Embed-v1
181
+ seq_len: 32768
182
+ size: 7851
183
+ dim: 4096
184
+ is_external: false
185
+ is_proprietary: false
186
+ is_sentence_transformers_compatible: false
187
+ uses_instruct: true
188
+ NV-Retriever-v1:
189
+ link: https://huggingface.co/nvidia/NV-Retriever-v1
190
+ seq_len: 512
191
+ size: 7111
192
+ dim: 4096
193
+ is_external: false
194
+ is_proprietary: false
195
+ is_sentence_transformers_compatible: false
196
+ uses_instruct: true
197
  OpenSearch-text-hybrid:
198
  link: https://help.aliyun.com/zh/open-search/vector-search-edition/hybrid-retrieval
199
  seq_len: 512
 
202
  is_external: true
203
  is_proprietary: true
204
  is_sentence_transformers_compatible: false
205
+ uses_instruct: false
206
  SFR-Embedding-Mistral:
207
  link: https://huggingface.co/Salesforce/SFR-Embedding-Mistral
208
  seq_len: 32768
 
211
  is_external: true
212
  is_proprietary: false
213
  is_sentence_transformers_compatible: true
214
+ uses_instruct: true
215
  all-MiniLM-L12-v2:
216
  link: https://huggingface.co/sentence-transformers/all-MiniLM-L12-v2
217
  seq_len: 512
 
220
  is_external: true
221
  is_proprietary: false
222
  is_sentence_transformers_compatible: true
223
+ uses_instruct: false
224
  all-MiniLM-L6-v2:
225
  link: https://huggingface.co/sentence-transformers/all-MiniLM-L6-v2
226
  seq_len: 512
 
229
  is_external: true
230
  is_proprietary: false
231
  is_sentence_transformers_compatible: true
232
+ uses_instruct: false
233
+ all-MiniLM-L6-v2-instruct:
234
+ link: https://huggingface.co/sentence-transformers/all-MiniLM-L6-v2
235
+ seq_len: 512
236
+ size: 23
237
+ dim: 384
238
+ is_external: true
239
+ is_proprietary: false
240
+ is_sentence_transformers_compatible: true
241
+ uses_instruct: true
242
  all-mpnet-base-v2:
243
  link: https://huggingface.co/sentence-transformers/all-mpnet-base-v2
244
  seq_len: 514
 
247
  is_external: true
248
  is_proprietary: false
249
  is_sentence_transformers_compatible: true
250
+ uses_instruct: false
251
+ all-mpnet-base-v2-instruct:
252
+ link: https://huggingface.co/sentence-transformers/all-mpnet-base-v2
253
+ seq_len: 514
254
+ size: 110
255
+ dim: 768
256
+ is_external: true
257
+ is_proprietary: false
258
+ is_sentence_transformers_compatible: true
259
+ uses_instruct: true
260
  allenai-specter:
261
  link: https://huggingface.co/sentence-transformers/allenai-specter
262
  seq_len: 512
 
265
  is_external: true
266
  is_proprietary: false
267
  is_sentence_transformers_compatible: true
268
+ uses_instruct: false
269
  bert-base-10lang-cased:
270
  link: https://huggingface.co/Geotrend/bert-base-10lang-cased
271
  seq_len: 512
 
274
  is_external: true
275
  is_proprietary: false
276
  is_sentence_transformers_compatible: true
277
+ uses_instruct: false
278
  bert-base-15lang-cased:
279
  link: https://huggingface.co/Geotrend/bert-base-15lang-cased
280
  seq_len: 512
 
283
  is_external: true
284
  is_proprietary: false
285
  is_sentence_transformers_compatible: true
286
+ uses_instruct: false
287
  bert-base-25lang-cased:
288
  link: https://huggingface.co/Geotrend/bert-base-25lang-cased
289
  seq_len: 512
 
292
  is_external: true
293
  is_proprietary: false
294
  is_sentence_transformers_compatible: true
295
+ uses_instruct: false
296
  bert-base-multilingual-cased:
297
  link: https://huggingface.co/google-bert/bert-base-multilingual-cased
298
  seq_len: 512
 
301
  is_external: true
302
  is_proprietary: false
303
  is_sentence_transformers_compatible: true
304
+ uses_instruct: false
305
  bert-base-multilingual-uncased:
306
  link: https://huggingface.co/google-bert/bert-base-multilingual-uncased
307
  seq_len: 512
 
310
  is_external: true
311
  is_proprietary: false
312
  is_sentence_transformers_compatible: true
313
+ uses_instruct: false
314
  bert-base-swedish-cased:
315
  link: https://huggingface.co/KB/bert-base-swedish-cased
316
  seq_len: 512
 
319
  is_external: true
320
  is_proprietary: false
321
  is_sentence_transformers_compatible: true
322
+ uses_instruct: false
323
  bert-base-uncased:
324
  link: https://huggingface.co/bert-base-uncased
325
  seq_len: 512
 
328
  is_external: true
329
  is_proprietary: false
330
  is_sentence_transformers_compatible: true
331
+ uses_instruct: false
332
+ bge-base-en-v1.5:
333
+ link: https://huggingface.co/BAAI/bge-base-en-v1.5
334
+ seq_len: 512
335
+ size: 438
336
+ dim: 768
337
+ is_external: true
338
+ is_proprietary: false
339
+ is_sentence_transformers_compatible: false
340
+ uses_instruct: false
341
+ bge-base-en-v1.5-instruct:
342
+ link: https://huggingface.co/BAAI/bge-base-en-v1.5
343
+ seq_len: 512
344
+ size: 438
345
+ dim: 768
346
+ is_external: true
347
+ is_proprietary: false
348
+ is_sentence_transformers_compatible: false
349
+ uses_instruct: true
350
  bge-base-zh-v1.5:
351
  link: https://huggingface.co/BAAI/bge-base-zh-v1.5
352
  seq_len: 512
 
355
  is_external: true
356
  is_proprietary: false
357
  is_sentence_transformers_compatible: true
358
+ uses_instruct: false
359
  bge-large-en-v1.5:
360
  link: https://huggingface.co/BAAI/bge-large-en-v1.5
361
  seq_len: 512
362
+ size: 1340
363
+ dim: 1024
364
+ is_external: true
365
+ is_proprietary: false
366
+ is_sentence_transformers_compatible: false
367
+ uses_instruct: false
368
+ bge-large-en-v1.5-instruct:
369
+ link: https://huggingface.co/BAAI/bge-large-en-v1.5
370
+ seq_len: 512
371
+ size: 1340
372
  dim: 1024
373
  is_external: true
374
  is_proprietary: false
375
  is_sentence_transformers_compatible: false
376
+ uses_instruct: true
377
  bge-large-zh-noinstruct:
378
  link: https://huggingface.co/BAAI/bge-large-zh-noinstruct
379
  seq_len: 512
 
382
  is_external: true
383
  is_proprietary: false
384
  is_sentence_transformers_compatible: true
385
+ uses_instruct: false
386
  bge-large-zh-v1.5:
387
  link: https://huggingface.co/BAAI/bge-large-zh-v1.5
388
  seq_len: 512
 
391
  is_external: true
392
  is_proprietary: false
393
  is_sentence_transformers_compatible: true
394
+ uses_instruct: false
395
  bge-m3:
396
  link: https://huggingface.co/BAAI/bge-m3
397
  seq_len: 8192
 
400
  is_external: true
401
  is_proprietary: false
402
  is_sentence_transformers_compatible: false
403
+ uses_instruct: false
404
+ bge-m3-instruct:
405
+ link: https://huggingface.co/BAAI/bge-m3
406
+ seq_len: 8192
407
+ size: 2270
408
+ dim: 1024
409
+ is_external: true
410
+ is_proprietary: false
411
+ is_sentence_transformers_compatible: false
412
+ uses_instruct: true
413
+ bge-small-en-v1.5:
414
+ link: https://huggingface.co/BAAI/bge-small-en-v1.5
415
+ seq_len: 512
416
+ size: 24
417
+ dim: 384
418
+ is_external: true
419
+ is_proprietary: false
420
+ is_sentence_transformers_compatible: true
421
+ uses_instruct: false
422
+ bge-small-en-v1.5-instruct:
423
+ link: https://huggingface.co/BAAI/bge-small-en-v1.5
424
+ seq_len: 512
425
+ size: 24
426
+ dim: 384
427
+ is_external: true
428
+ is_proprietary: false
429
+ is_sentence_transformers_compatible: true
430
+ uses_instruct: true
431
  bge-small-zh-v1.5:
432
  link: https://huggingface.co/BAAI/bge-small-zh-v1.5
433
  seq_len: 512
 
436
  is_external: true
437
  is_proprietary: false
438
  is_sentence_transformers_compatible: true
439
+ uses_instruct: false
440
+ bm25:
441
  link: https://en.wikipedia.org/wiki/Okapi_BM25
442
  size: 0
443
  is_external: true
444
  is_proprietary: false
445
  is_sentence_transformers_compatible: false
446
+ uses_instruct: false
447
+ bm25s:
448
+ link: https://github.com/xhluca/bm25s
449
+ size: 0
450
+ is_external: true
451
+ is_proprietary: false
452
+ is_sentence_transformers_compatible: false
453
+ uses_instruct: false
454
  camembert-base:
455
  link: https://huggingface.co/almanach/camembert-base
456
  seq_len: 512
 
459
  is_external: false
460
  is_proprietary: false
461
  is_sentence_transformers_compatible: true
462
+ uses_instruct: false
463
  camembert-large:
464
  link: https://huggingface.co/almanach/camembert-large
465
  seq_len: 512
 
468
  is_external: false
469
  is_proprietary: false
470
  is_sentence_transformers_compatible: true
471
+ uses_instruct: false
472
  contriever-base-msmarco:
473
  link: https://huggingface.co/nthakur/contriever-base-msmarco
474
  seq_len: 512
 
477
  is_external: true
478
  is_proprietary: false
479
  is_sentence_transformers_compatible: true
480
+ uses_instruct: false
481
+ contriever:
482
+ link: https://huggingface.co/facebook/contriever
483
+ seq_len: 512
484
+ size: 438
485
+ dim: 768
486
+ is_external: true
487
+ is_proprietary: false
488
+ is_sentence_transformers_compatible: false
489
+ uses_instruct: false
490
+ contriever-instruct:
491
+ link: https://huggingface.co/facebook/contriever
492
+ seq_len: 512
493
+ size: 438
494
+ dim: 768
495
+ is_external: true
496
+ is_proprietary: false
497
+ is_sentence_transformers_compatible: false
498
+ uses_instruct: true
499
  cross-en-de-roberta-sentence-transformer:
500
  link: https://huggingface.co/T-Systems-onsite/cross-en-de-roberta-sentence-transformer
501
  seq_len: 514
 
504
  is_external: true
505
  is_proprietary: false
506
  is_sentence_transformers_compatible: true
507
+ uses_instruct: false
508
  dfm-encoder-large-v1:
509
  link: https://huggingface.co/chcaa/dfm-encoder-large-v1
510
  seq_len: 512
 
513
  is_external: true
514
  is_proprietary: false
515
  is_sentence_transformers_compatible: true
516
+ uses_instruct: false
517
  dfm-sentence-encoder-large-1:
518
  link: https://huggingface.co/chcaa/dfm-encoder-large-v1
519
  seq_len: 512
 
522
  is_external: true
523
  is_proprietary: false
524
  is_sentence_transformers_compatible: true
525
+ uses_instruct: false
526
  distilbert-base-25lang-cased:
527
  link: https://huggingface.co/Geotrend/distilbert-base-25lang-cased
528
  seq_len: 512
 
531
  is_external: false
532
  is_proprietary: false
533
  is_sentence_transformers_compatible: true
534
+ uses_instruct: false
535
  distilbert-base-en-fr-cased:
536
  link: https://huggingface.co/Geotrend/distilbert-base-en-fr-cased
537
  seq_len: 512
 
540
  is_external: false
541
  is_proprietary: false
542
  is_sentence_transformers_compatible: true
543
+ uses_instruct: false
544
  distilbert-base-en-fr-es-pt-it-cased:
545
  link: https://huggingface.co/Geotrend/distilbert-base-en-fr-es-pt-it-cased
546
  seq_len: 512
 
549
  is_external: false
550
  is_proprietary: false
551
  is_sentence_transformers_compatible: true
552
+ uses_instruct: false
553
  distilbert-base-fr-cased:
554
  link: https://huggingface.co/Geotrend/distilbert-base-fr-cased
555
  seq_len: 512
 
558
  is_external: false
559
  is_proprietary: false
560
  is_sentence_transformers_compatible: true
561
+ uses_instruct: false
562
  distilbert-base-uncased:
563
  link: https://huggingface.co/distilbert-base-uncased
564
  seq_len: 512
 
567
  is_external: false
568
  is_proprietary: false
569
  is_sentence_transformers_compatible: true
570
+ uses_instruct: false
571
  distiluse-base-multilingual-cased-v2:
572
  link: https://huggingface.co/sentence-transformers/distiluse-base-multilingual-cased-v2
573
  seq_len: 512
 
576
  is_external: true
577
  is_proprietary: false
578
  is_sentence_transformers_compatible: true
579
+ uses_instruct: false
580
+ dragon-plus:
581
+ link: https://github.com/facebookresearch/dpr-scale/tree/main/dragon
582
+ seq_len: 512
583
+ size: 438
584
+ dim: 768
585
+ is_external: true
586
+ is_proprietary: false
587
+ is_sentence_transformers_compatible: false
588
+ uses_instruct: false
589
+ dragon-plus-instruct:
590
+ link: https://github.com/facebookresearch/dpr-scale/tree/main/dragon
591
+ seq_len: 512
592
+ size: 438
593
+ dim: 768
594
+ is_external: true
595
+ is_proprietary: false
596
+ is_sentence_transformers_compatible: false
597
+ uses_instruct: true
598
  e5-base-4k:
599
  link: https://huggingface.co/dwzhu/e5-base-4k
600
  seq_len: 512
 
603
  is_external: true
604
  is_proprietary: false
605
  is_sentence_transformers_compatible: true
606
+ uses_instruct: false
607
  e5-base-v2:
608
  link: https://huggingface.co/intfloat/e5-base-v2
609
  seq_len: 512
 
612
  is_external: true
613
  is_proprietary: false
614
  is_sentence_transformers_compatible: true
615
+ uses_instruct: false
616
  e5-base:
617
  link: https://huggingface.co/intfloat/e5-base
618
  seq_len: 512
 
621
  is_external: true
622
  is_proprietary: false
623
  is_sentence_transformers_compatible: true
624
+ uses_instruct: false
625
  e5-large-v2:
626
  link: https://huggingface.co/intfloat/e5-large-v2
627
  seq_len: 512
 
630
  is_external: true
631
  is_proprietary: false
632
  is_sentence_transformers_compatible: true
633
+ uses_instruct: false
634
  e5-large:
635
  link: https://huggingface.co/intfloat/e5-large
636
  seq_len: 512
 
639
  is_external: true
640
  is_proprietary: false
641
  is_sentence_transformers_compatible: true
642
+ uses_instruct: false
643
  e5-mistral-7b-instruct:
644
  link: https://huggingface.co/intfloat/e5-mistral-7b-instruct
645
  seq_len: 32768
 
648
  is_external: true
649
  is_proprietary: false
650
  is_sentence_transformers_compatible: true
651
+ uses_instruct: true
652
+ e5-mistral-7b-instruct-noinstruct:
653
+ link: https://huggingface.co/intfloat/e5-mistral-7b-instruct
654
+ seq_len: 32768
655
+ size: 7111
656
+ dim: 4096
657
+ is_external: true
658
+ is_proprietary: false
659
+ is_sentence_transformers_compatible: true
660
+ uses_instruct: false
661
  e5-small:
662
  link: https://huggingface.co/intfloat/e5-small
663
  seq_len: 512
 
666
  is_external: true
667
  is_proprietary: false
668
  is_sentence_transformers_compatible: true
669
+ uses_instruct: false
670
  electra-small-nordic:
671
  link: https://huggingface.co/jonfd/electra-small-nordic
672
  seq_len: 512
 
675
  is_external: true
676
  is_proprietary: false
677
  is_sentence_transformers_compatible: true
678
+ uses_instruct: false
679
  electra-small-swedish-cased-discriminator:
680
  link: https://huggingface.co/KBLab/electra-small-swedish-cased-discriminator
681
  seq_len: 512
 
684
  is_external: true
685
  is_proprietary: false
686
  is_sentence_transformers_compatible: true
687
+ uses_instruct: false
688
  elser-v2:
689
  link: https://www.elastic.co/guide/en/machine-learning/current/ml-nlp-elser.html
690
  seq_len: 512
 
693
  is_external: true
694
  is_proprietary: false
695
  is_sentence_transformers_compatible: false
696
+ uses_instruct: false
697
  flan-t5-base:
698
  link: https://huggingface.co/google/flan-t5-base
699
  seq_len: 512
 
702
  is_external: true
703
  is_proprietary: false
704
  is_sentence_transformers_compatible: true
705
+ uses_instruct: true
706
  flan-t5-large:
707
  link: https://huggingface.co/google/flan-t5-large
708
  seq_len: 512
 
711
  is_external: true
712
  is_proprietary: false
713
  is_sentence_transformers_compatible: true
714
+ uses_instruct: true
715
  flaubert_base_cased:
716
  link: https://huggingface.co/flaubert/flaubert_base_cased
717
  seq_len: 512
 
720
  is_external: true
721
  is_proprietary: false
722
  is_sentence_transformers_compatible: true
723
+ uses_instruct: false
724
  flaubert_base_uncased:
725
  link: https://huggingface.co/flaubert/flaubert_base_uncased
726
  seq_len: 512
 
729
  is_external: true
730
  is_proprietary: false
731
  is_sentence_transformers_compatible: true
732
+ uses_instruct: false
733
  flaubert_large_cased:
734
  link: https://huggingface.co/flaubert/flaubert_large_cased
735
  seq_len: 512
 
738
  is_external: true
739
  is_proprietary: false
740
  is_sentence_transformers_compatible: true
741
+ uses_instruct: false
742
  gbert-base:
743
  link: https://huggingface.co/deepset/gbert-base
744
  seq_len: 512
 
747
  is_external: true
748
  is_proprietary: false
749
  is_sentence_transformers_compatible: true
750
+ uses_instruct: false
751
  gbert-large:
752
  link: https://huggingface.co/deepset/gbert-large
753
  seq_len: 512
 
756
  is_external: true
757
  is_proprietary: false
758
  is_sentence_transformers_compatible: true
759
+ uses_instruct: false
760
  gelectra-base:
761
  link: https://huggingface.co/deepset/gelectra-base
762
  seq_len: 512
 
765
  is_external: true
766
  is_proprietary: false
767
  is_sentence_transformers_compatible: true
768
+ uses_instruct: false
769
  gelectra-large:
770
  link: https://huggingface.co/deepset/gelectra-large
771
  seq_len: 512
 
774
  is_external: true
775
  is_proprietary: false
776
  is_sentence_transformers_compatible: true
777
+ uses_instruct: false
778
  glove.6B.300d:
779
  link: https://huggingface.co/sentence-transformers/average_word_embeddings_glove.6B.300d
780
  seq_len: N/A
 
783
  is_external: true
784
  is_proprietary: false
785
  is_sentence_transformers_compatible: true
786
+ uses_instruct: false
787
  google-gecko-256.text-embedding-preview-0409:
788
  link: https://cloud.google.com/vertex-ai/generative-ai/docs/embeddings/get-text-embeddings#latest_models
789
  seq_len: 2048
 
792
  is_external: true
793
  is_proprietary: true
794
  is_sentence_transformers_compatible: false
795
+ uses_instruct: false
796
  google-gecko.text-embedding-preview-0409:
797
  link: https://cloud.google.com/vertex-ai/generative-ai/docs/embeddings/get-text-embeddings#latest_models
798
  seq_len: 2048
 
801
  is_external: true
802
  is_proprietary: true
803
  is_sentence_transformers_compatible: false
804
+ uses_instruct: false
805
  gottbert-base:
806
  link: https://huggingface.co/uklfr/gottbert-base
807
  seq_len: 512
 
810
  is_external: true
811
  is_proprietary: false
812
  is_sentence_transformers_compatible: true
813
+ uses_instruct: false
814
  gte-Qwen1.5-7B-instruct:
815
  link: https://huggingface.co/Alibaba-NLP/gte-Qwen1.5-7B-instruct
816
  seq_len: 32768
 
819
  is_external: true
820
  is_proprietary: false
821
  is_sentence_transformers_compatible: true
822
+ uses_instruct: true
823
  gte-Qwen2-7B-instruct:
824
  link: https://huggingface.co/Alibaba-NLP/gte-Qwen2-7B-instruct
825
  seq_len: 32768
 
828
  is_external: true
829
  is_proprietary: false
830
  is_sentence_transformers_compatible: true
831
+ uses_instruct: true
832
  gtr-t5-base:
833
  link: https://huggingface.co/sentence-transformers/gtr-t5-base
834
  seq_len: 512
 
837
  is_external: true
838
  is_proprietary: false
839
  is_sentence_transformers_compatible: true
840
+ uses_instruct: false
841
  gtr-t5-large:
842
  link: https://huggingface.co/sentence-transformers/gtr-t5-large
843
  seq_len: 512
 
846
  is_external: true
847
  is_proprietary: false
848
  is_sentence_transformers_compatible: true
849
+ uses_instruct: false
850
  gtr-t5-xl:
851
  link: https://huggingface.co/sentence-transformers/gtr-t5-xl
852
  seq_len: 512
 
855
  is_external: true
856
  is_proprietary: false
857
  is_sentence_transformers_compatible: true
858
+ uses_instruct: false
859
  gtr-t5-xxl:
860
  link: https://huggingface.co/sentence-transformers/gtr-t5-xxl
861
  seq_len: 512
 
864
  is_external: true
865
  is_proprietary: false
866
  is_sentence_transformers_compatible: true
867
+ uses_instruct: false
868
  herbert-base-retrieval-v2:
869
  link: https://huggingface.co/ipipan/herbert-base-retrieval-v2
870
  seq_len: 514
 
873
  is_external: true
874
  is_proprietary: false
875
  is_sentence_transformers_compatible: true
876
+ uses_instruct: false
877
  instructor-base:
878
  link: https://huggingface.co/hkunlp/instructor-base
879
  seq_len: N/A
 
882
  is_external: true
883
  is_proprietary: false
884
  is_sentence_transformers_compatible: true
885
+ uses_instruct: true
886
  instructor-large:
887
  link: https://huggingface.co/hkunlp/instructor-large
888
  seq_len: 512
 
891
  is_external: true
892
  is_proprietary: false
893
  is_sentence_transformers_compatible: true
894
+ uses_instruct: true
895
  instructor-xl:
896
  link: https://huggingface.co/hkunlp/instructor-xl
897
  seq_len: 512
 
900
  is_external: true
901
  is_proprietary: false
902
  is_sentence_transformers_compatible: true
903
+ uses_instruct: true
904
  jina-embeddings-v2-base-en:
905
  link: https://huggingface.co/jinaai/jina-embeddings-v2-base-en
906
  seq_len: 8192
 
909
  is_external: true
910
  is_proprietary: false
911
  is_sentence_transformers_compatible: true
912
+ uses_instruct: false
913
  komninos:
914
  link: https://huggingface.co/sentence-transformers/average_word_embeddings_komninos
915
  seq_len: N/A
 
918
  is_external: true
919
  is_proprietary: false
920
  is_sentence_transformers_compatible: true
921
+ uses_instruct: false
922
  llama-2-7b-chat:
923
  link: https://huggingface.co/meta-llama/Llama-2-7b-chat-hf
924
  seq_len: 4096
 
927
  is_external: true
928
  is_proprietary: false
929
  is_sentence_transformers_compatible: false
930
+ uses_instruct: true
931
  luotuo-bert-medium:
932
  link: https://huggingface.co/silk-road/luotuo-bert-medium
933
  seq_len: 512
 
936
  is_external: true
937
  is_proprietary: false
938
  is_sentence_transformers_compatible: true
939
+ uses_instruct: false
940
  m3e-base:
941
  link: https://huggingface.co/moka-ai/m3e-base
942
  seq_len: 512
 
945
  is_external: true
946
  is_proprietary: false
947
  is_sentence_transformers_compatible: true
948
+ uses_instruct: false
949
  m3e-large:
950
  link: https://huggingface.co/moka-ai/m3e-large
951
  seq_len: 512
 
954
  is_external: true
955
  is_proprietary: false
956
  is_sentence_transformers_compatible: true
957
+ uses_instruct: false
958
  mistral-7b-instruct-v0.2:
959
  link: https://huggingface.co/mistralai/Mistral-7B-Instruct-v0.2
960
  seq_len: 4096
 
963
  is_external: true
964
  is_proprietary: false
965
  is_sentence_transformers_compatible: false
966
+ uses_instruct: true
967
  mistral-embed:
968
  link: https://docs.mistral.ai/guides/embeddings
969
  seq_len: null
 
972
  is_external: true
973
  is_proprietary: true
974
  is_sentence_transformers_compatible: false
975
+ uses_instruct: false
976
  monobert-large-msmarco:
977
  link: https://huggingface.co/castorini/monobert-large-msmarco
978
  seq_len: 512
 
981
  is_external: true
982
  is_proprietary: false
983
  is_sentence_transformers_compatible: false
984
+ uses_instruct: false
985
  monot5-3b-msmarco-10k:
986
  link: https://huggingface.co/castorini/monot5-3b-msmarco-10k
987
  seq_len: 512
 
990
  is_external: true
991
  is_proprietary: false
992
  is_sentence_transformers_compatible: false
993
+ uses_instruct: true
994
  monot5-base-msmarco-10k:
995
  link: https://huggingface.co/castorini/monot5-base-msmarco-10k
996
  seq_len: 512
 
999
  is_external: true
1000
  is_proprietary: false
1001
  is_sentence_transformers_compatible: false
1002
+ uses_instruct: true
1003
  msmarco-bert-co-condensor:
1004
  link: https://huggingface.co/sentence-transformers/msmarco-bert-co-condensor
1005
  seq_len: 512
 
1008
  is_external: true
1009
  is_proprietary: false
1010
  is_sentence_transformers_compatible: true
1011
+ uses_instruct: false
1012
  multi-qa-MiniLM-L6-cos-v1:
1013
  link: https://huggingface.co/sentence-transformers/multi-qa-MiniLM-L6-cos-v1
1014
  seq_len: 512
 
1017
  is_external: true
1018
  is_proprietary: false
1019
  is_sentence_transformers_compatible: true
1020
+ uses_instruct: false
1021
  multilingual-e5-base:
1022
  link: https://huggingface.co/intfloat/multilingual-e5-base
1023
  seq_len: 514
 
1026
  is_external: true
1027
  is_proprietary: false
1028
  is_sentence_transformers_compatible: true
1029
+ uses_instruct: false
1030
  multilingual-e5-large:
1031
  link: https://huggingface.co/intfloat/multilingual-e5-large
1032
  seq_len: 514
 
1035
  is_external: true
1036
  is_proprietary: false
1037
  is_sentence_transformers_compatible: true
1038
+ uses_instruct: false
1039
  multilingual-e5-small:
1040
  link: https://huggingface.co/intfloat/multilingual-e5-small
1041
  seq_len: 512
 
1044
  is_external: true
1045
  is_proprietary: false
1046
  is_sentence_transformers_compatible: true
1047
+ uses_instruct: false
1048
  nb-bert-base:
1049
  link: https://huggingface.co/NbAiLab/nb-bert-base
1050
  seq_len: 512
 
1053
  is_external: true
1054
  is_proprietary: false
1055
  is_sentence_transformers_compatible: true
1056
+ uses_instruct: false
1057
  nb-bert-large:
1058
  link: https://huggingface.co/NbAiLab/nb-bert-large
1059
  seq_len: 512
 
1062
  is_external: true
1063
  is_proprietary: false
1064
  is_sentence_transformers_compatible: true
1065
+ uses_instruct: false
1066
  nomic-embed-text-v1:
1067
  link: https://huggingface.co/nomic-ai/nomic-embed-text-v1
1068
  seq_len: 8192
 
1071
  is_external: true
1072
  is_proprietary: false
1073
  is_sentence_transformers_compatible: true
1074
+ uses_instruct: false
1075
  nomic-embed-text-v1.5-128:
1076
  link: https://huggingface.co/nomic-ai/nomic-embed-text-v1.5
1077
  seq_len: 8192
 
1080
  is_external: true
1081
  is_proprietary: false
1082
  is_sentence_transformers_compatible: true
1083
+ uses_instruct: false
1084
  nomic-embed-text-v1.5-256:
1085
  link: https://huggingface.co/nomic-ai/nomic-embed-text-v1.5
1086
  seq_len: 8192
 
1089
  is_external: true
1090
  is_proprietary: false
1091
  is_sentence_transformers_compatible: true
1092
+ uses_instruct: false
1093
  nomic-embed-text-v1.5-512:
1094
  link: https://huggingface.co/nomic-ai/nomic-embed-text-v1.5
1095
  seq_len: 8192
 
1098
  is_external: true
1099
  is_proprietary: false
1100
  is_sentence_transformers_compatible: true
1101
+ uses_instruct: false
1102
  nomic-embed-text-v1.5-64:
1103
  link: https://huggingface.co/nomic-ai/nomic-embed-text-v1.5
1104
  seq_len: 8192
 
1107
  is_external: true
1108
  is_proprietary: false
1109
  is_sentence_transformers_compatible: true
1110
+ uses_instruct: false
1111
  norbert3-base:
1112
  link: https://huggingface.co/ltg/norbert3-base
1113
  seq_len: 512
 
1116
  is_external: true
1117
  is_proprietary: false
1118
  is_sentence_transformers_compatible: true
1119
+ uses_instruct: false
1120
  norbert3-large:
1121
  link: https://huggingface.co/ltg/norbert3-large
1122
  seq_len: 512
 
1125
  is_external: true
1126
  is_proprietary: false
1127
  is_sentence_transformers_compatible: true
1128
+ uses_instruct: false
1129
  paraphrase-multilingual-MiniLM-L12-v2:
1130
  link: https://huggingface.co/sentence-transformers/paraphrase-multilingual-MiniLM-L12-v2
1131
  seq_len: 512
 
1134
  is_external: true
1135
  is_proprietary: false
1136
  is_sentence_transformers_compatible: true
1137
+ uses_instruct: false
1138
  paraphrase-multilingual-mpnet-base-v2:
1139
  link: https://huggingface.co/sentence-transformers/paraphrase-multilingual-mpnet-base-v2
1140
  seq_len: 514
 
1143
  is_external: true
1144
  is_proprietary: false
1145
  is_sentence_transformers_compatible: true
1146
+ uses_instruct: false
1147
  sentence-bert-swedish-cased:
1148
  link: https://huggingface.co/KBLab/sentence-bert-swedish-cased
1149
  seq_len: 512
 
1152
  is_external: true
1153
  is_proprietary: false
1154
  is_sentence_transformers_compatible: true
1155
+ uses_instruct: false
1156
  sentence-camembert-base:
1157
  link: https://huggingface.co/dangvantuan/sentence-camembert-base
1158
  seq_len: 512
 
1161
  is_external: true
1162
  is_proprietary: false
1163
  is_sentence_transformers_compatible: true
1164
+ uses_instruct: false
1165
  sentence-camembert-large:
1166
  link: https://huggingface.co/dangvantuan/sentence-camembert-large
1167
  seq_len: 512
 
1170
  is_external: true
1171
  is_proprietary: false
1172
  is_sentence_transformers_compatible: true
1173
+ uses_instruct: false
1174
  sentence-croissant-llm-base:
1175
  link: https://huggingface.co/Wissam42/sentence-croissant-llm-base
1176
  seq_len: 2048
 
1179
  is_external: true
1180
  is_proprietary: false
1181
  is_sentence_transformers_compatible: true
1182
+ uses_instruct: false
1183
  sentence-t5-base:
1184
  link: https://huggingface.co/sentence-transformers/sentence-t5-base
1185
  seq_len: 512
 
1188
  is_external: true
1189
  is_proprietary: false
1190
  is_sentence_transformers_compatible: true
1191
+ uses_instruct: false
1192
  sentence-t5-large:
1193
  link: https://huggingface.co/sentence-transformers/sentence-t5-large
1194
  seq_len: 512
 
1197
  is_external: true
1198
  is_proprietary: false
1199
  is_sentence_transformers_compatible: true
1200
+ uses_instruct: false
1201
  sentence-t5-xl:
1202
  link: https://huggingface.co/sentence-transformers/sentence-t5-xl
1203
  seq_len: 512
 
1206
  is_external: true
1207
  is_proprietary: false
1208
  is_sentence_transformers_compatible: true
1209
+ uses_instruct: false
1210
  sentence-t5-xxl:
1211
  link: https://huggingface.co/sentence-transformers/sentence-t5-xxl
1212
  seq_len: 512
 
1215
  is_external: true
1216
  is_proprietary: false
1217
  is_sentence_transformers_compatible: true
1218
+ uses_instruct: false
1219
  silver-retriever-base-v1:
1220
  link: https://huggingface.co/ipipan/silver-retriever-base-v1
1221
  seq_len: 514
 
1224
  is_external: true
1225
  is_proprietary: false
1226
  is_sentence_transformers_compatible: true
1227
+ uses_instruct: false
1228
  st-polish-paraphrase-from-distilroberta:
1229
  link: https://huggingface.co/sdadas/st-polish-paraphrase-from-distilroberta
1230
  seq_len: 514
 
1233
  is_external: true
1234
  is_proprietary: false
1235
  is_sentence_transformers_compatible: true
1236
+ uses_instruct: false
1237
  st-polish-paraphrase-from-mpnet:
1238
  link: https://huggingface.co/sdadas/st-polish-paraphrase-from-mpnet
1239
  seq_len: 514
 
1242
  is_external: true
1243
  is_proprietary: false
1244
  is_sentence_transformers_compatible: true
1245
+ uses_instruct: false
1246
  sup-simcse-bert-base-uncased:
1247
  link: https://huggingface.co/princeton-nlp/sup-simcse-bert-base-uncased
1248
  seq_len: 512
 
1251
  is_external: true
1252
  is_proprietary: false
1253
  is_sentence_transformers_compatible: true
1254
+ uses_instruct: false
1255
  text-embedding-3-large:
1256
  link: https://openai.com/blog/new-embedding-models-and-api-updates
1257
  seq_len: 8191
 
1260
  is_external: true
1261
  is_proprietary: true
1262
  is_sentence_transformers_compatible: false
1263
+ uses_instruct: false
1264
+ text-embedding-3-large-instruct:
1265
+ link: https://openai.com/blog/new-embedding-models-and-api-updates
1266
+ seq_len: 8191
1267
+ size: null
1268
+ dim: 3072
1269
+ is_external: true
1270
+ is_proprietary: true
1271
+ is_sentence_transformers_compatible: false
1272
+ uses_instruct: true
1273
  text-embedding-3-large-256:
1274
  link: https://openai.com/blog/new-embedding-models-and-api-updates
1275
  seq_len: 8191
 
1278
  is_external: true
1279
  is_proprietary: true
1280
  is_sentence_transformers_compatible: false
1281
+ uses_instruct: false
1282
  text-embedding-3-small:
1283
  link: https://openai.com/blog/new-embedding-models-and-api-updates
1284
  seq_len: 8191
 
1287
  is_external: true
1288
  is_proprietary: true
1289
  is_sentence_transformers_compatible: false
1290
+ uses_instruct: false
1291
+ text-embedding-3-small-instruct:
1292
+ link: https://openai.com/blog/new-embedding-models-and-api-updates
1293
+ seq_len: 8191
1294
+ size: null
1295
+ dim: 1536
1296
+ is_external: true
1297
+ is_proprietary: true
1298
+ is_sentence_transformers_compatible: false
1299
+ uses_instruct: true
1300
  text-embedding-ada-002:
1301
  link: https://openai.com/blog/new-and-improved-embedding-model
1302
  seq_len: 8191
 
1305
  is_external: true
1306
  is_proprietary: true
1307
  is_sentence_transformers_compatible: false
1308
+ uses_instruct: false
1309
+ text-embedding-ada-002-instruct:
1310
+ link: https://openai.com/blog/new-and-improved-embedding-model
1311
+ seq_len: 8191
1312
+ size: null
1313
+ dim: 1536
1314
+ is_external: true
1315
+ is_proprietary: true
1316
+ is_sentence_transformers_compatible: false
1317
+ uses_instruct: true
1318
  text-search-ada-001:
1319
  link: https://openai.com/blog/introducing-text-and-code-embeddings
1320
  seq_len: 2046
 
1323
  is_external: true
1324
  is_proprietary: true
1325
  is_sentence_transformers_compatible: false
1326
+ uses_instruct: false
1327
  text-search-ada-doc-001:
1328
  link: https://openai.com/blog/introducing-text-and-code-embeddings
1329
  seq_len: 2046
 
1332
  is_external: true
1333
  is_proprietary: true
1334
  is_sentence_transformers_compatible: false
1335
+ uses_instruct: false
1336
  text-search-ada-query-001:
1337
  link: https://openai.com/blog/introducing-text-and-code-embeddings
1338
  seq_len: 2046
 
1341
  is_external: false
1342
  is_proprietary: true
1343
  is_sentence_transformers_compatible: false
1344
+ uses_instruct: false
1345
  text-search-babbage-001:
1346
  link: https://openai.com/blog/introducing-text-and-code-embeddings
1347
  seq_len: 2046
 
1350
  is_external: true
1351
  is_proprietary: true
1352
  is_sentence_transformers_compatible: false
1353
+ uses_instruct: false
1354
  text-search-curie-001:
1355
  link: https://openai.com/blog/introducing-text-and-code-embeddings
1356
  seq_len: 2046
 
1359
  is_external: true
1360
  is_proprietary: true
1361
  is_sentence_transformers_compatible: false
1362
+ uses_instruct: false
1363
  text-search-davinci-001:
1364
  link: https://openai.com/blog/introducing-text-and-code-embeddings
1365
  seq_len: 2046
 
1368
  is_external: true
1369
  is_proprietary: true
1370
  is_sentence_transformers_compatible: false
1371
+ uses_instruct: false
1372
  text-similarity-ada-001:
1373
  link: https://openai.com/blog/introducing-text-and-code-embeddings
1374
  seq_len: 2046
 
1377
  is_external: true
1378
  is_proprietary: true
1379
  is_sentence_transformers_compatible: false
1380
+ uses_instruct: false
1381
  text-similarity-babbage-001:
1382
  link: https://openai.com/blog/introducing-text-and-code-embeddings
1383
  seq_len: 2046
 
1386
  is_external: true
1387
  is_proprietary: true
1388
  is_sentence_transformers_compatible: false
1389
+ uses_instruct: false
1390
  text-similarity-curie-001:
1391
  link: https://openai.com/blog/introducing-text-and-code-embeddings
1392
  seq_len: 2046
 
1395
  is_external: true
1396
  is_proprietary: true
1397
  is_sentence_transformers_compatible: false
1398
+ uses_instruct: false
1399
  text-similarity-davinci-001:
1400
  link: https://openai.com/blog/introducing-text-and-code-embeddings
1401
  seq_len: 2046
 
1404
  is_external: true
1405
  is_proprietary: true
1406
  is_sentence_transformers_compatible: false
1407
+ uses_instruct: false
1408
  tart-dual-contriever-msmarco:
1409
  link: https://huggingface.co/orionweller/tart-dual-contriever-msmarco
1410
  seq_len: 512
 
1413
  is_external: true
1414
  is_proprietary: false
1415
  is_sentence_transformers_compatible: false
1416
+ uses_instruct: true
1417
  tart-full-flan-t5-xl:
1418
  link: https://huggingface.co/facebook/tart-full-flan-t5-xl
1419
  seq_len: 512
 
1422
  is_external: true
1423
  is_proprietary: false
1424
  is_sentence_transformers_compatible: false
1425
+ uses_instruct: true
1426
  text2vec-base-chinese:
1427
  link: https://huggingface.co/shibing624/text2vec-base-chinese
1428
  seq_len: 512
 
1431
  is_external: true
1432
  is_proprietary: false
1433
  is_sentence_transformers_compatible: true
1434
+ uses_instruct: false
1435
  text2vec-base-multilingual:
1436
  link: null
1437
  seq_len: null
 
1440
  is_external: true
1441
  is_proprietary: false
1442
  is_sentence_transformers_compatible: false
1443
+ uses_instruct: false
1444
  text2vec-large-chinese:
1445
  link: https://huggingface.co/GanymedeNil/text2vec-large-chinese
1446
  seq_len: 512
 
1449
  is_external: true
1450
  is_proprietary: false
1451
  is_sentence_transformers_compatible: true
1452
+ uses_instruct: false
1453
  titan-embed-text-v1:
1454
  link: https://docs.aws.amazon.com/bedrock/latest/userguide/embeddings.html
1455
  seq_len: 8000
 
1458
  is_external: true
1459
  is_proprietary: true
1460
  is_sentence_transformers_compatible: false
1461
+ uses_instruct: false
1462
  udever-bloom-1b1:
1463
  link: https://huggingface.co/izhx/udever-bloom-1b1
1464
  seq_len: 2048
 
1467
  is_external: true
1468
  is_proprietary: false
1469
  is_sentence_transformers_compatible: true
1470
+ uses_instruct: false
1471
  udever-bloom-560m:
1472
  link: https://huggingface.co/izhx/udever-bloom-560m
1473
  seq_len: 2048
 
1476
  is_external: true
1477
  is_proprietary: false
1478
  is_sentence_transformers_compatible: true
1479
+ uses_instruct: false
1480
  universal-sentence-encoder-multilingual-3:
1481
  link: https://huggingface.co/vprelovac/universal-sentence-encoder-multilingual-3
1482
  seq_len: 512
 
1485
  is_external: true
1486
  is_proprietary: false
1487
  is_sentence_transformers_compatible: true
1488
+ uses_instruct: false
1489
  universal-sentence-encoder-multilingual-large-3:
1490
  link: https://huggingface.co/vprelovac/universal-sentence-encoder-multilingual-large-3
1491
  seq_len: 512
 
1494
  is_external: true
1495
  is_proprietary: false
1496
  is_sentence_transformers_compatible: true
1497
+ uses_instruct: false
1498
  unsup-simcse-bert-base-uncased:
1499
  link: https://huggingface.co/princeton-nlp/unsup-simcse-bert-base-uncased
1500
  seq_len: 512
 
1503
  is_external: true
1504
  is_proprietary: false
1505
  is_sentence_transformers_compatible: true
1506
+ uses_instruct: false
1507
  use-cmlm-multilingual:
1508
  link: https://huggingface.co/sentence-transformers/use-cmlm-multilingual
1509
  seq_len: 512
 
1512
  is_external: true
1513
  is_proprietary: false
1514
  is_sentence_transformers_compatible: true
1515
+ uses_instruct: false
1516
  voyage-2:
1517
  link: https://docs.voyageai.com/embeddings/
1518
  seq_len: 1024
 
1521
  is_external: true
1522
  is_proprietary: true
1523
  is_sentence_transformers_compatible: false
1524
+ uses_instruct: false
1525
  voyage-code-2:
1526
  link: https://docs.voyageai.com/embeddings/
1527
  seq_len: 16000
 
1530
  is_external: true
1531
  is_proprietary: true
1532
  is_sentence_transformers_compatible: false
1533
+ uses_instruct: false
1534
  voyage-large-2-instruct:
1535
  link: https://docs.voyageai.com/embeddings/
1536
  seq_len: 16000
 
1539
  is_external: true
1540
  is_proprietary: true
1541
  is_sentence_transformers_compatible: false
1542
+ uses_instruct: true
1543
  voyage-law-2:
1544
  link: https://docs.voyageai.com/embeddings/
1545
  seq_len: 16000
 
1548
  is_external: true
1549
  is_proprietary: true
1550
  is_sentence_transformers_compatible: false
1551
+ uses_instruct: false
1552
  voyage-lite-01-instruct:
1553
  link: https://docs.voyageai.com/embeddings/
1554
  seq_len: 4000
 
1557
  is_external: true
1558
  is_proprietary: true
1559
  is_sentence_transformers_compatible: false
1560
+ uses_instruct: true
1561
  voyage-lite-02-instruct:
1562
  link: https://docs.voyageai.com/embeddings/
1563
  seq_len: 4000
 
1566
  is_external: true
1567
  is_proprietary: true
1568
  is_sentence_transformers_compatible: false
1569
+ uses_instruct: true
1570
  voyage-multilingual-2:
1571
  link: https://docs.voyageai.com/embeddings/
1572
  seq_len: 32000
 
1575
  is_external: true
1576
  is_proprietary: true
1577
  is_sentence_transformers_compatible: false
1578
+ uses_instruct: false
1579
  xlm-roberta-base:
1580
  link: https://huggingface.co/xlm-roberta-base
1581
  seq_len: 514
 
1584
  is_external: true
1585
  is_proprietary: false
1586
  is_sentence_transformers_compatible: true
1587
+ uses_instruct: false
1588
  xlm-roberta-large:
1589
  link: https://huggingface.co/xlm-roberta-large
1590
  seq_len: 514
 
1593
  is_external: true
1594
  is_proprietary: false
1595
  is_sentence_transformers_compatible: true
1596
+ uses_instruct: false
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1597
  models_to_skip:
1598
  - michaelfeil/ct2fast-e5-large-v2
1599
  - McGill-NLP/LLM2Vec-Sheared-LLaMA-mntp-unsup-simcse
refresh.py CHANGED
@@ -1,7 +1,6 @@
1
  from functools import reduce
2
  import json
3
  import os
4
- import pickle
5
  import re
6
 
7
  from datasets import load_dataset
@@ -47,6 +46,8 @@ SENTENCE_TRANSFORMERS_COMPATIBLE_MODELS = {k for k,v in MODEL_META["model_meta"]
47
  MODELS_TO_SKIP = MODEL_META["models_to_skip"]
48
  CROSS_ENCODERS = MODEL_META["cross_encoders"]
49
  BI_ENCODERS = [k for k, _ in MODEL_META["model_meta"].items() if k not in CROSS_ENCODERS + ["bm25"]]
 
 
50
 
51
 
52
 
@@ -87,7 +88,7 @@ def make_clickable_model(model_name, link=None):
87
 
88
 
89
  def add_lang(examples):
90
- if not(examples["eval_language"]):
91
  examples["mteb_dataset_name_with_lang"] = examples["mteb_dataset_name"]
92
  else:
93
  examples["mteb_dataset_name_with_lang"] = examples["mteb_dataset_name"] + f' ({examples["eval_language"]})'
@@ -407,7 +408,7 @@ def refresh_leaderboard():
407
  pbar_tasks = tqdm(BOARDS_CONFIG.items(), desc="Fetching leaderboard results for ???", total=len(BOARDS_CONFIG), leave=True)
408
  for board, board_config in pbar_tasks:
409
  # To add only a single new board, you can uncomment the below to be faster
410
- # if board != "new_board_name": continue
411
  boards_data[board] = {
412
  "data_overall": None,
413
  "data_tasks": {}
 
1
  from functools import reduce
2
  import json
3
  import os
 
4
  import re
5
 
6
  from datasets import load_dataset
 
46
  MODELS_TO_SKIP = MODEL_META["models_to_skip"]
47
  CROSS_ENCODERS = MODEL_META["cross_encoders"]
48
  BI_ENCODERS = [k for k, _ in MODEL_META["model_meta"].items() if k not in CROSS_ENCODERS + ["bm25"]]
49
+ INSTRUCT_MODELS = {k for k,v in MODEL_META["model_meta"].items() if v.get("uses_instruct", False)}
50
+ NOINSTRUCT_MODELS = {k for k,v in MODEL_META["model_meta"].items() if not v.get("uses_instruct", False)}
51
 
52
 
53
 
 
88
 
89
 
90
  def add_lang(examples):
91
+ if not(examples["eval_language"]) or (examples["eval_language"] == "default"):
92
  examples["mteb_dataset_name_with_lang"] = examples["mteb_dataset_name"]
93
  else:
94
  examples["mteb_dataset_name_with_lang"] = examples["mteb_dataset_name"] + f' ({examples["eval_language"]})'
 
408
  pbar_tasks = tqdm(BOARDS_CONFIG.items(), desc="Fetching leaderboard results for ???", total=len(BOARDS_CONFIG), leave=True)
409
  for board, board_config in pbar_tasks:
410
  # To add only a single new board, you can uncomment the below to be faster
411
+ # if board != "rar-b": continue
412
  boards_data[board] = {
413
  "data_overall": None,
414
  "data_tasks": {}