Spaces:
Running
Running
Julien Simon
committed on
Commit
·
d0c0894
1
Parent(s):
261211b
Add Arcee-Lite on c7g
Browse files
- results.py +21 -0
- results_arcee_lite.py +22 -0
results.py
CHANGED
@@ -129,6 +129,27 @@ instance_type_mappings = {
|
|
129 |
"url": "https://instances.vantage.sh/aws/ec2/c7i.4xlarge",
|
130 |
"price": 0.714,
|
131 |
},
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
132 |
"inf2.xlarge": {
|
133 |
"cloud": "AWS",
|
134 |
"gpu": "2xNeuronCore v2",
|
|
|
129 |
"url": "https://instances.vantage.sh/aws/ec2/c7i.4xlarge",
|
130 |
"price": 0.714,
|
131 |
},
|
132 |
+
"c7g.2xlarge": {
|
133 |
+
"cloud": "AWS",
|
134 |
+
"gpu": "-",
|
135 |
+
"gpuRAM": "-",
|
136 |
+
"url": "https://instances.vantage.sh/aws/ec2/c7g.2xlarge",
|
137 |
+
"price": 0.29,
|
138 |
+
},
|
139 |
+
"c7g.4xlarge": {
|
140 |
+
"cloud": "AWS",
|
141 |
+
"gpu": "-",
|
142 |
+
"gpuRAM": "-",
|
143 |
+
"url": "https://instances.vantage.sh/aws/ec2/c7g.4xlarge",
|
144 |
+
"price": 0.58,
|
145 |
+
},
|
146 |
+
"c7g.8xlarge": {
|
147 |
+
"cloud": "AWS",
|
148 |
+
"gpu": "-",
|
149 |
+
"gpuRAM": "-",
|
150 |
+
"url": "https://instances.vantage.sh/aws/ec2/c7g.8xlarge",
|
151 |
+
"price": 1.16,
|
152 |
+
},
|
153 |
"inf2.xlarge": {
|
154 |
"cloud": "AWS",
|
155 |
"gpu": "2xNeuronCore v2",
|
results_arcee_lite.py
CHANGED
@@ -91,5 +91,27 @@ results_arcee_lite = {
|
|
91 |
},
|
92 |
],
|
93 |
},
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
94 |
],
|
95 |
}
|
|
|
91 |
},
|
92 |
],
|
93 |
},
|
94 |
+
{
|
95 |
+
"instanceType": "c7g.2xlarge",
|
96 |
+
"configurations": [
|
97 |
+
{
|
98 |
+
"container": "PyTorch 2.4.1 on EC2",
|
99 |
+
"quantization": "none",
|
100 |
+
"status": "OK",
|
101 |
+
"tokensPerSecond": "16.5",
|
102 |
+
},
|
103 |
+
],
|
104 |
+
},
|
105 |
+
{
|
106 |
+
"instanceType": "c7g.8xlarge",
|
107 |
+
"configurations": [
|
108 |
+
{
|
109 |
+
"container": "PyTorch 2.4.1 on EC2",
|
110 |
+
"quantization": "none",
|
111 |
+
"status": "OK",
|
112 |
+
"tokensPerSecond": "26",
|
113 |
+
},
|
114 |
+
],
|
115 |
+
},
|
116 |
],
|
117 |
}
|