Julien Simon committed on
Commit
d17a4c1
1 Parent(s): 2b18bbe

Add SuperNova on inf2 with LMI 0.30rc1

Browse files
Files changed (1) hide show
  1. results_arcee_supernova.py +16 -2
results_arcee_supernova.py CHANGED
@@ -106,6 +106,13 @@ results_arcee_supernova = {
106
  "tokensPerSecond": "32",
107
  "notes": "bs=2,seqlen=8192 - SDK 2.19.1",
108
  },
 
 
 
 
 
 
 
109
  ],
110
  },
111
  {
@@ -123,7 +130,7 @@ results_arcee_supernova = {
123
  "container": "LMI 0.29+vLLM 0.5.5",
124
  "status": "OK",
125
  "tokensPerSecond": "45",
126
- "notes": "",
127
  },
128
  ],
129
  },
@@ -142,7 +149,14 @@ results_arcee_supernova = {
142
  "container": "LMI 0.29+vLLM 0.5.5",
143
  "status": "OK",
144
  "tokensPerSecond": "70",
145
- "notes": "",
 
 
 
 
 
 
 
146
  },
147
  ],
148
  },
 
106
  "tokensPerSecond": "32",
107
  "notes": "bs=2,seqlen=8192 - SDK 2.19.1",
108
  },
109
+ {
110
+ "quantization": "none",
111
+ "container": "LMI 0.30rc1",
112
+ "status": "OK",
113
+ "tokensPerSecond": "34",
114
+ "notes": "bs=2,seqlen=8192 - SDK 2.20",
115
+ },
116
  ],
117
  },
118
  {
 
130
  "container": "LMI 0.29+vLLM 0.5.5",
131
  "status": "OK",
132
  "tokensPerSecond": "45",
133
+ "notes": "OPTION_MAX_MODEL_LEN 64k",
134
  },
135
  ],
136
  },
 
149
  "container": "LMI 0.29+vLLM 0.5.5",
150
  "status": "OK",
151
  "tokensPerSecond": "70",
152
+ "notes": "OPTION_MAX_MODEL_LEN 128k",
153
+ },
154
+ {
155
+ "quantization": "none",
156
+ "container": "LMI 0.29+vLLM 0.5.5",
157
+ "status": "OK",
158
+ "tokensPerSecond": "70",
159
+ "notes": "OPTION_ENFORCE_EAGER=True",
160
  },
161
  ],
162
  },