Julien Simon committed on
Commit
ce1f985
1 Parent(s): 7f6d9bd

8K/16K works with SuperNova-AWQ on g5

Browse files
Files changed (1) hide show
  1. results_arcee_supernova.py +1 -1
results_arcee_supernova.py CHANGED
@@ -10,7 +10,7 @@ results_arcee_supernova = {
10
  "container": "TGI 2.2.0",
11
  "status": "OK",
12
  "tokensPerSecond": "33",
13
- "notes": "8K/16K",
14
  },
15
  {
16
  "instanceType": "inf2.24xlarge",
 
10
  "container": "TGI 2.2.0",
11
  "status": "OK",
12
  "tokensPerSecond": "33",
13
+ "notes": "MAX_INPUT_TOKENS: 8192, MAX_TOTAL_TOKENS: 16384",
14
  },
15
  {
16
  "instanceType": "inf2.24xlarge",