Benchmarks / results_virtuoso_small.py
Julien Simon
Add g6e.48xlarge
f011c00
raw
history blame
436 Bytes
"""Module containing performance results for the Virtuoso-Small model."""
# Benchmark record for Virtuoso-Small: top-level model identity plus a list
# with one dict per benchmarked configuration.
results_virtuoso_small = {
    "name": "Virtuoso-Small",
    "modelType": "Qwen2.5 14B",
    "configurations": [
        # Every field in this entry is a string, including the
        # tokens-per-second figure; "notes" is deliberately left empty.
        {
            "instanceType": "g6e.48xlarge",
            "quantization": "none",
            "container": "LMI 0.30+vLLM 0.6.2",
            "status": "OK",
            "tokensPerSecond": "78",
            "notes": "",
        },
    ],
}