Spaces:
Sleeping
Sleeping
Julien Simon
committed on
Commit
•
261211b
1
Parent(s):
ea42ef4
Add SuperNova 8-bit for inf2 and trn1
Browse files - results_arcee_supernova.py +14 -0
results_arcee_supernova.py
CHANGED
@@ -78,6 +78,13 @@ results_arcee_supernova = {
|
|
78 |
"tokensPerSecond": "-",
|
79 |
"notes": "OOM bs=2,seqlen=16384 - SDK 2.19.1",
|
80 |
},
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
81 |
],
|
82 |
},
|
83 |
{
|
@@ -90,6 +97,13 @@ results_arcee_supernova = {
|
|
90 |
"tokensPerSecond": "32",
|
91 |
"notes": "bs=2,seqlen=8192 - SDK 2.19.1",
|
92 |
},
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
93 |
],
|
94 |
},
|
95 |
{
|
|
|
78 |
"tokensPerSecond": "-",
|
79 |
"notes": "OOM bs=2,seqlen=16384 - SDK 2.19.1",
|
80 |
},
|
81 |
+
{
|
82 |
+
"quantization": "8-bit",
|
83 |
+
"container": "LMI 0.29+transformers-neuronx 0.11.351",
|
84 |
+
"status": "OK",
|
85 |
+
"tokensPerSecond": "14",
|
86 |
+
"notes": "bs=2,seqlen=8192 - SDK 2.19.1",
|
87 |
+
},
|
88 |
],
|
89 |
},
|
90 |
{
|
|
|
97 |
"tokensPerSecond": "32",
|
98 |
"notes": "bs=2,seqlen=8192 - SDK 2.19.1",
|
99 |
},
|
100 |
+
{
|
101 |
+
"quantization": "8-bit",
|
102 |
+
"container": "LMI 0.29+transformers-neuronx 0.11.351",
|
103 |
+
"status": "OK",
|
104 |
+
"tokensPerSecond": "24.6",
|
105 |
+
"notes": "bs=2,seqlen=8192 - SDK 2.19.1",
|
106 |
+
},
|
107 |
],
|
108 |
},
|
109 |
{
|