Spaces:
Running
Running
Julien Simon
committed on
Commit
•
37a6a80
1
Parent(s):
e009fe7
Add inf2.xlarge benchmark
Browse files- results_llama_spark.py +7 -0
results_llama_spark.py
CHANGED
@@ -105,5 +105,12 @@ results_llama_spark = {
|
|
105 |
"tokensPerSecond": "-",
|
106 |
"notes": "Llama-3.1: TGI OK, Neuron SDK OK, optimum-neuron KO",
|
107 |
},
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
108 |
],
|
109 |
}
|
|
|
105 |
"tokensPerSecond": "-",
|
106 |
"notes": "Llama-3.1: TGI OK, Neuron SDK OK, optimum-neuron KO",
|
107 |
},
|
108 |
+
{
|
109 |
+
"instanceType": "inf2.2xlarge",
|
110 |
+
"container": "transformers-neuronx 0.11.351",
|
111 |
+
"status": "OK",
|
112 |
+
"tokensPerSecond": "24",
|
113 |
+
"notes": "Neuron SDK 2.19.1",
|
114 |
+
},
|
115 |
],
|
116 |
}
|