Julien Simon committed on
Commit
261211b
1 Parent(s): ea42ef4

Add SuperNova 8-bit for inf2 and trn1

Browse files
Files changed (1) hide show
  1. results_arcee_supernova.py +14 -0
results_arcee_supernova.py CHANGED
@@ -78,6 +78,13 @@ results_arcee_supernova = {
78
  "tokensPerSecond": "-",
79
  "notes": "OOM bs=2,seqlen=16384 - SDK 2.19.1",
80
  },
 
 
 
 
 
 
 
81
  ],
82
  },
83
  {
@@ -90,6 +97,13 @@ results_arcee_supernova = {
90
  "tokensPerSecond": "32",
91
  "notes": "bs=2,seqlen=8192 - SDK 2.19.1",
92
  },
 
 
 
 
 
 
 
93
  ],
94
  },
95
  {
 
78
  "tokensPerSecond": "-",
79
  "notes": "OOM bs=2,seqlen=16384 - SDK 2.19.1",
80
  },
81
+ {
82
+ "quantization": "8-bit",
83
+ "container": "LMI 0.29+transformers-neuronx 0.11.351",
84
+ "status": "OK",
85
+ "tokensPerSecond": "14",
86
+ "notes": "bs=2,seqlen=8192 - SDK 2.19.1",
87
+ },
88
  ],
89
  },
90
  {
 
97
  "tokensPerSecond": "32",
98
  "notes": "bs=2,seqlen=8192 - SDK 2.19.1",
99
  },
100
+ {
101
+ "quantization": "8-bit",
102
+ "container": "LMI 0.29+transformers-neuronx 0.11.351",
103
+ "status": "OK",
104
+ "tokensPerSecond": "24.6",
105
+ "notes": "bs=2,seqlen=8192 - SDK 2.19.1",
106
+ },
107
  ],
108
  },
109
  {