Julien Simon committed on
Commit
22854a2
1 Parent(s): 6b33c1f

SuperNova g6e.2xlarge

Browse files
Files changed (1) hide show
  1. results_arcee_supernova.py +8 -0
results_arcee_supernova.py CHANGED
@@ -36,6 +36,14 @@ results_arcee_supernova = {
36
  "tokensPerSecond": "18",
37
  "notes": "--max-model-len 10000 --max-num-seqs 16 --enforce-eager",
38
  },
 
 
 
 
 
 
 
 
39
  {
40
  "instanceType": "p4d.24xlarge",
41
  "quantization": "awq",
 
36
  "tokensPerSecond": "18",
37
  "notes": "--max-model-len 10000 --max-num-seqs 16 --enforce-eager",
38
  },
39
+ {
40
+ "instanceType": "g6e.2xlarge",
41
+ "quantization": "Q4_K_M",
42
+ "container": "llama.cpp 10/2/24",
43
+ "status": "OK",
44
+ "tokensPerSecond": "16",
45
+ "notes": "-ngl 81 -c 13000 -fa -t 8",
46
+ },
47
  {
48
  "instanceType": "p4d.24xlarge",
49
  "quantization": "awq",