Spaces:
Running
Running
Julien Simon
committed on
Commit
•
8639c9c
1
Parent(s):
dc891f5
Add SuperNova on LMI+vLLM
Browse files
- results_arcee_supernova.py +32 -10
results_arcee_supernova.py
CHANGED
@@ -110,19 +110,41 @@ results_arcee_supernova = {
|
|
110 |
},
|
111 |
{
|
112 |
"instanceType": "p4d.24xlarge",
|
113 |
-
"
|
114 |
-
|
115 |
-
|
116 |
-
|
117 |
-
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
118 |
},
|
119 |
{
|
120 |
"instanceType": "p5.48xlarge",
|
121 |
-
"
|
122 |
-
|
123 |
-
|
124 |
-
|
125 |
-
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
126 |
},
|
127 |
],
|
128 |
}
|
|
|
110 |
},
|
111 |
{
|
112 |
"instanceType": "p4d.24xlarge",
|
113 |
+
"configurations": [
|
114 |
+
{
|
115 |
+
"quantization": "none",
|
116 |
+
"container": "TGI 2.2.0",
|
117 |
+
"status": "OK",
|
118 |
+
"tokensPerSecond": "30",
|
119 |
+
"notes": "",
|
120 |
+
},
|
121 |
+
{
|
122 |
+
"quantization": "none",
|
123 |
+
"container": "LMI 0.29+vLLM 0.5.5",
|
124 |
+
"status": "OK",
|
125 |
+
"tokensPerSecond": "45",
|
126 |
+
"notes": "",
|
127 |
+
},
|
128 |
+
],
|
129 |
},
|
130 |
{
|
131 |
"instanceType": "p5.48xlarge",
|
132 |
+
"configurations": [
|
133 |
+
{
|
134 |
+
"quantization": "none",
|
135 |
+
"container": "TGI 2.2.0",
|
136 |
+
"status": "OK",
|
137 |
+
"tokensPerSecond": "58",
|
138 |
+
"notes": "MAX_INPUT_TOKENS: 16384, MAX_TOTAL_TOKENS: 32768",
|
139 |
+
},
|
140 |
+
{
|
141 |
+
"quantization": "none",
|
142 |
+
"container": "LMI 0.29+vLLM 0.5.5",
|
143 |
+
"status": "xxx",
|
144 |
+
"tokensPerSecond": "70",
|
145 |
+
"notes": "",
|
146 |
+
},
|
147 |
+
],
|
148 |
},
|
149 |
],
|
150 |
}
|