Benchmarks / results_arcee_meraj.py
Julien Simon
Update
b63ff12
raw
history blame
1.33 kB
"""Module containing performance results for the Arcee-Meraj model."""
# Benchmark results for the Arcee-Meraj model.
#
# Every recorded run uses the same six keys, and all runs listed here have
# status "OK" with empty notes, so the varying fields are kept as compact rows
# and expanded into one dictionary per configuration. Throughput values are
# intentionally kept as strings, exactly as recorded.
results_arcee_meraj = {
    "name": "Arcee-Meraj",
    "modelType": "Qwen2 72B",
    "configurations": [
        {
            "instanceType": instance_type,
            "quantization": quantization,
            "container": container,
            "status": "OK",
            "tokensPerSecond": tokens_per_second,
            "notes": "",
        }
        # Row layout: (instanceType, quantization, container, tokensPerSecond)
        for instance_type, quantization, container, tokens_per_second in (
            ("g5.12xlarge", "awq", "TGI 2.2.0", "33"),
            ("g6e.12xlarge", "awq", "vLLM 0.5.5", "45"),
            ("g6e.12xlarge", "awq", "TGI 2.2.0", "46"),
            ("g6e.12xlarge", "awq", "SGLang 0.2.13", "47.1"),
            ("p4d.24xlarge", "none", "TGI 2.2.0", "38"),
        )
    ],
}