Julien Simon committed on
Commit
37a6a80
1 Parent(s): e009fe7

Add inf2.xlarge benchmark

Browse files
Files changed (1) hide show
  1. results_llama_spark.py +7 -0
results_llama_spark.py CHANGED
@@ -105,5 +105,12 @@ results_llama_spark = {
105
  "tokensPerSecond": "-",
106
  "notes": "Llama-3.1: TGI OK, Neuron SDK OK, optimum-neuron KO",
107
  },
 
 
 
 
 
 
 
108
  ],
109
  }
 
105
  "tokensPerSecond": "-",
106
  "notes": "Llama-3.1: TGI OK, Neuron SDK OK, optimum-neuron KO",
107
  },
108
+ {
109
+ "instanceType": "inf2.2xlarge",
110
+ "container": "transformers-neuronx 0.11.351",
111
+ "status": "OK",
112
+ "tokensPerSecond": "24",
113
+ "notes": "Neuron SDK 2.19.1",
114
+ },
115
  ],
116
  }