Julien Simon committed on
Commit
8639c9c
1 Parent(s): dc891f5

Add SuperNova on LMI+vLLM

Browse files
Files changed (1) hide show
  1. results_arcee_supernova.py +32 -10
results_arcee_supernova.py CHANGED
@@ -110,19 +110,41 @@ results_arcee_supernova = {
110
  },
111
  {
112
  "instanceType": "p4d.24xlarge",
113
- "quantization": "none",
114
- "container": "TGI 2.2.0",
115
- "status": "OK",
116
- "tokensPerSecond": "30",
117
- "notes": "",
 
 
 
 
 
 
 
 
 
 
 
118
  },
119
  {
120
  "instanceType": "p5.48xlarge",
121
- "quantization": "none",
122
- "container": "TGI 2.2.0",
123
- "status": "OK",
124
- "tokensPerSecond": "58",
125
- "notes": "MAX_INPUT_TOKENS: 16384, MAX_TOTAL_TOKENS: 32768",
 
 
 
 
 
 
 
 
 
 
 
126
  },
127
  ],
128
  }
 
110
  },
111
  {
112
  "instanceType": "p4d.24xlarge",
113
+ "configurations": [
114
+ {
115
+ "quantization": "none",
116
+ "container": "TGI 2.2.0",
117
+ "status": "OK",
118
+ "tokensPerSecond": "30",
119
+ "notes": "",
120
+ },
121
+ {
122
+ "quantization": "none",
123
+ "container": "LMI 0.29+vLLM 0.5.5",
124
+ "status": "OK",
125
+ "tokensPerSecond": "45",
126
+ "notes": "",
127
+ },
128
+ ],
129
  },
130
  {
131
  "instanceType": "p5.48xlarge",
132
+ "configurations": [
133
+ {
134
+ "quantization": "none",
135
+ "container": "TGI 2.2.0",
136
+ "status": "OK",
137
+ "tokensPerSecond": "58",
138
+ "notes": "MAX_INPUT_TOKENS: 16384, MAX_TOTAL_TOKENS: 32768",
139
+ },
140
+ {
141
+ "quantization": "none",
142
+ "container": "LMI 0.29+vLLM 0.5.5",
143
+ "status": "xxx",
144
+ "tokensPerSecond": "70",
145
+ "notes": "",
146
+ },
147
+ ],
148
  },
149
  ],
150
  }