# Benchmarks / results.py
# Julien Simon
# Add g6e.48xlarge
# f011c00
# raw
# history blame
# 8.87 kB
"""Module containing model configuration results for various AI models and hardware setups."""
from results_arcee_agent import results_arcee_agent
from results_arcee_lite import results_arcee_lite
from results_arcee_meraj import results_arcee_meraj
from results_arcee_nova import results_arcee_nova
from results_arcee_scribe import results_arcee_scribe
from results_arcee_spark import results_arcee_spark
from results_arcee_supernova import results_arcee_supernova
from results_arcee_supernova_medius import results_arcee_supernova_medius
from results_llama_spark import results_llama_spark
from results_llama_supernova_lite import results_llama_supernova_lite
from results_virtuoso_large import results_virtuoso_large
from results_virtuoso_medium import results_virtuoso_medium
from results_virtuoso_small import results_virtuoso_small
# Lookup table keyed by instance type name. Every entry carries the same keys:
#   "cloud"  - cloud provider name
#   "gpu"    - accelerator count and model ("-" or a CPU description when the
#              instance has no accelerator)
#   "gpuRAM" - total accelerator memory across all devices ("-" when none)
#   "url"    - instance details page
#   "price"  - numeric price (presumably on-demand USD per hour; confirm
#              against the pricing source before relying on the unit)
# Keys with a "(N GPUs)" suffix describe a subset of a larger instance; their
# price is the full-instance price scaled by the fraction of GPUs used.
instance_type_mappings = {
    "g5.xlarge": {
        "cloud": "AWS",
        "gpu": "1xNVIDIA A10G",
        "gpuRAM": "24 GB",
        "url": "https://instances.vantage.sh/aws/ec2/g5.xlarge",
        "price": 1.006,
    },
    "g5.2xlarge": {
        "cloud": "AWS",
        "gpu": "1xNVIDIA A10G",
        "gpuRAM": "24 GB",
        "url": "https://instances.vantage.sh/aws/ec2/g5.2xlarge",
        "price": 1.212,
    },
    "g5.12xlarge": {
        "cloud": "AWS",
        "gpu": "4xNVIDIA A10G",
        "gpuRAM": "96 GB",
        "url": "https://instances.vantage.sh/aws/ec2/g5.12xlarge",
        "price": 5.672,
    },
    "g5.48xlarge": {
        "cloud": "AWS",
        "gpu": "8xNVIDIA A10G",
        "gpuRAM": "192 GB",
        "url": "https://instances.vantage.sh/aws/ec2/g5.48xlarge",
        "price": 16.288,
    },
    "g6.2xlarge": {
        "cloud": "AWS",
        "gpu": "1xNVIDIA L4",
        "gpuRAM": "24 GB",
        "url": "https://instances.vantage.sh/aws/ec2/g6.2xlarge",
        "price": 0.9776,
    },
    "g6.12xlarge": {
        "cloud": "AWS",
        "gpu": "4xNVIDIA L4",
        "gpuRAM": "96 GB",
        "url": "https://instances.vantage.sh/aws/ec2/g6.12xlarge",
        "price": 4.602,
    },
    "g6.48xlarge": {
        "cloud": "AWS",
        "gpu": "8xNVIDIA L4",
        "gpuRAM": "192 GB",
        "url": "https://instances.vantage.sh/aws/ec2/g6.48xlarge",
        "price": 13.35,
    },
    "g6e.2xlarge": {
        "cloud": "AWS",
        "gpu": "1xNVIDIA L40S",
        "gpuRAM": "48 GB",
        "url": "https://instances.vantage.sh/aws/ec2/g6e.2xlarge",
        "price": 2.242,
    },
    "g6e.12xlarge": {
        "cloud": "AWS",
        "gpu": "4xNVIDIA L40S",
        "gpuRAM": "192 GB",
        "url": "https://instances.vantage.sh/aws/ec2/g6e.12xlarge",
        "price": 10.493,
    },
    "g6e.12xlarge (2 GPUs)": {
        "cloud": "AWS",
        "gpu": "2xNVIDIA L40S",
        "gpuRAM": "96 GB",
        "url": "https://instances.vantage.sh/aws/ec2/g6e.12xlarge",
        "price": 5.2465,
    },
    "g6e.48xlarge": {
        "cloud": "AWS",
        "gpu": "8xNVIDIA L40S",
        # 8 x 48 GB, consistent with the 1-, 2- and 4-GPU g6e entries above.
        "gpuRAM": "384 GB",
        "url": "https://instances.vantage.sh/aws/ec2/g6e.48xlarge",
        "price": 30.131,
    },
    "g4dn.12xlarge": {
        "cloud": "AWS",
        "gpu": "4xNVIDIA T4",
        "gpuRAM": "64 GB",
        "url": "https://instances.vantage.sh/aws/ec2/g4dn.12xlarge",
        "price": 3.912,
    },
    "p4d.24xlarge": {
        "cloud": "AWS",
        # 8 x A100 40 GB, which is what the 320 GB total corresponds to.
        "gpu": "8xNVIDIA A100",
        "gpuRAM": "320 GB",
        "url": "https://instances.vantage.sh/aws/ec2/p4d.24xlarge",
        "price": 32.773,
    },
    "p4de.24xlarge": {
        "cloud": "AWS",
        "gpu": "8xNVIDIA A100",
        # p4de uses the 80 GB A100 variant: 8 x 80 GB.
        "gpuRAM": "640 GB",
        "url": "https://instances.vantage.sh/aws/ec2/p4de.24xlarge",
        "price": 40.966,
    },
    "p5.48xlarge": {
        "cloud": "AWS",
        "gpu": "8xNVIDIA H100",
        "gpuRAM": "640GB",
        "url": "https://instances.vantage.sh/aws/ec2/p5.48xlarge",
        "price": 98.32,
    },
    "p5.48xlarge (4 GPUs)": {
        "cloud": "AWS",
        "gpu": "4xNVIDIA H100",
        "gpuRAM": "320GB",
        "url": "https://instances.vantage.sh/aws/ec2/p5.48xlarge",
        "price": 49.16,
    },
    "p5.48xlarge (2 GPUs)": {
        "cloud": "AWS",
        "gpu": "2xNVIDIA H100",
        "gpuRAM": "160GB",
        "url": "https://instances.vantage.sh/aws/ec2/p5.48xlarge",
        "price": 24.58,
    },
    "p5.48xlarge (1 GPU)": {
        "cloud": "AWS",
        "gpu": "1xNVIDIA H100",
        "gpuRAM": "80GB",
        "url": "https://instances.vantage.sh/aws/ec2/p5.48xlarge",
        "price": 12.29,
    },
    "c6i.xlarge": {
        "cloud": "AWS",
        "gpu": "-",
        "gpuRAM": "-",
        "url": "https://instances.vantage.sh/aws/ec2/c6i.xlarge",
        # Half of c6i.2xlarge; every entry must expose "price" so lookups
        # do not raise KeyError for this instance type.
        "price": 0.17,
    },
    "c6i.2xlarge": {
        "cloud": "AWS",
        "gpu": "-",
        "gpuRAM": "-",
        "url": "https://instances.vantage.sh/aws/ec2/c6i.2xlarge",
        "price": 0.34,
    },
    "c6i.4xlarge": {
        "cloud": "AWS",
        "gpu": "-",
        "gpuRAM": "-",
        "url": "https://instances.vantage.sh/aws/ec2/c6i.4xlarge",
        "price": 0.68,
    },
    "c7i.4xlarge": {
        "cloud": "AWS",
        "gpu": "-",
        "gpuRAM": "-",
        "url": "https://instances.vantage.sh/aws/ec2/c7i.4xlarge",
        "price": 0.714,
    },
    "c7g.2xlarge": {
        "cloud": "AWS",
        "gpu": "None - Graviton3, 8 vCPUs",
        "gpuRAM": "-",
        "url": "https://instances.vantage.sh/aws/ec2/c7g.2xlarge",
        "price": 0.29,
    },
    "c7g.4xlarge": {
        "cloud": "AWS",
        "gpu": "None - Graviton3, 16 vCPUs",
        "gpuRAM": "-",
        "url": "https://instances.vantage.sh/aws/ec2/c7g.4xlarge",
        "price": 0.58,
    },
    "c7g.8xlarge": {
        "cloud": "AWS",
        "gpu": "None - Graviton3, 32 vCPUs",
        "gpuRAM": "-",
        "url": "https://instances.vantage.sh/aws/ec2/c7g.8xlarge",
        "price": 1.16,
    },
    "c7g.16xlarge": {
        "cloud": "AWS",
        "gpu": "None - Graviton3, 64 vCPUs",
        "gpuRAM": "-",
        "url": "https://instances.vantage.sh/aws/ec2/c7g.16xlarge",
        "price": 2.32,
    },
    "c8g.4xlarge": {
        "cloud": "AWS",
        "gpu": "None - Graviton4, 16 vCPUs",
        "gpuRAM": "-",
        "url": "https://instances.vantage.sh/aws/ec2/c8g.4xlarge",
        "price": 0.6381,
    },
    "c8g.8xlarge": {
        "cloud": "AWS",
        "gpu": "None - Graviton4, 32 vCPUs",
        "gpuRAM": "-",
        "url": "https://instances.vantage.sh/aws/ec2/c8g.8xlarge",
        "price": 1.276,
    },
    "c8g.16xlarge": {
        "cloud": "AWS",
        "gpu": "None - Graviton4, 64 vCPUs",
        "gpuRAM": "-",
        "url": "https://instances.vantage.sh/aws/ec2/c8g.16xlarge",
        "price": 2.552,
    },
    "r8g.4xlarge": {
        "cloud": "AWS",
        "gpu": "None - Graviton4, 16 vCPUs",
        "gpuRAM": "-",
        "url": "https://instances.vantage.sh/aws/ec2/r8g.4xlarge",
        "price": 0.9426,
    },
    "r8g.8xlarge": {
        "cloud": "AWS",
        "gpu": "None - Graviton4, 32 vCPUs",
        "gpuRAM": "-",
        "url": "https://instances.vantage.sh/aws/ec2/r8g.8xlarge",
        "price": 1.885,
    },
    "r8g.16xlarge": {
        "cloud": "AWS",
        "gpu": "None - Graviton4, 64 vCPUs",
        "gpuRAM": "-",
        "url": "https://instances.vantage.sh/aws/ec2/r8g.16xlarge",
        "price": 3.77,
    },
    "inf2.xlarge": {
        "cloud": "AWS",
        "gpu": "2xNeuronCore v2",
        "gpuRAM": "32 GB",
        "url": "https://instances.vantage.sh/aws/ec2/inf2.xlarge",
        "price": 0.7582,
    },
    "inf2.8xlarge": {
        "cloud": "AWS",
        # One Inferentia2 chip, i.e. two NeuronCores like inf2.xlarge; the
        # Inf2 rows count cores, not chips.
        "gpu": "2xNeuronCore v2",
        "gpuRAM": "32 GB",
        "url": "https://instances.vantage.sh/aws/ec2/inf2.8xlarge",
        "price": 1.968,
    },
    "inf2.24xlarge": {
        "cloud": "AWS",
        "gpu": "12xNeuronCore v2",
        "gpuRAM": "192 GB",
        "url": "https://instances.vantage.sh/aws/ec2/inf2.24xlarge",
        "price": 6.491,
    },
    "inf2.48xlarge": {
        "cloud": "AWS",
        "gpu": "24xNeuronCore v2",
        "gpuRAM": "384 GB",
        "url": "https://instances.vantage.sh/aws/ec2/inf2.48xlarge",
        "price": 12.981,
    },
    "trn1.32xlarge": {
        "cloud": "AWS",
        "gpu": "32xNeuronCore v2",
        "gpuRAM": "512 GB",
        "url": "https://instances.vantage.sh/aws/ec2/trn1.32xlarge",
        "price": 21.50,
    },
}
# Aggregate of the per-model result objects imported at the top of this
# module, exposed under the single key "models". The list order is kept
# exactly as written.
results = dict(
    models=[
        results_arcee_meraj,
        results_arcee_supernova,
        results_arcee_nova,
        results_llama_spark,
        results_arcee_agent,
        results_arcee_spark,
        results_arcee_lite,
        results_arcee_scribe,
        results_llama_supernova_lite,
        results_arcee_supernova_medius,
        results_virtuoso_small,
        results_virtuoso_medium,
        results_virtuoso_large,
    ],
)