Julien Simon committed on
Commit
31ed7d9
1 Parent(s): 246b217

Add SuperNova Lite on r8g.8xlarge

Browse files
Files changed (2) hide show
  1. results.py +7 -0
  2. results_llama_supernova_lite.py +9 -1
results.py CHANGED
@@ -157,6 +157,13 @@ instance_type_mappings = {
157
  "url": "https://instances.vantage.sh/aws/ec2/c7g.16xlarge",
158
  "price": 2.32,
159
  },
 
 
 
 
 
 
 
160
  "r8g.16xlarge": {
161
  "cloud": "AWS",
162
  "gpu": "None - Graviton4, 64 vCPUs",
 
157
  "url": "https://instances.vantage.sh/aws/ec2/c7g.16xlarge",
158
  "price": 2.32,
159
  },
160
+ "r8g.8xlarge": {
161
+ "cloud": "AWS",
162
+ "gpu": "None - Graviton4, 32 vCPUs",
163
+ "gpuRAM": "-",
164
+ "url": "https://instances.vantage.sh/aws/ec2/r8g.8xlarge",
165
+ "price": 1.885,
166
+ },
167
  "r8g.16xlarge": {
168
  "cloud": "AWS",
169
  "gpu": "None - Graviton4, 64 vCPUs",
results_llama_supernova_lite.py CHANGED
@@ -20,10 +20,18 @@ results_llama_supernova_lite = {
20
  "tokensPerSecond": "45.5",
21
  "notes": "",
22
  },
 
 
 
 
 
 
 
 
23
  {
24
  "instanceType": "r8g.16xlarge",
25
  "quantization": "Q4_0_4_8",
26
- "container": "llama.cpp 9/119/24",
27
  "status": "OK",
28
  "tokensPerSecond": "65",
29
  "notes": "",
 
20
  "tokensPerSecond": "45.5",
21
  "notes": "",
22
  },
23
+ {
24
+ "instanceType": "r8g.8xlarge",
25
+ "quantization": "Q4_0_4_8",
26
+ "container": "llama.cpp 9/11/24",
27
+ "status": "OK",
28
+ "tokensPerSecond": "57",
29
+ "notes": "",
30
+ },
31
  {
32
  "instanceType": "r8g.16xlarge",
33
  "quantization": "Q4_0_4_8",
34
+ "container": "llama.cpp 9/11/24",
35
  "status": "OK",
36
  "tokensPerSecond": "65",
37
  "notes": "",