Upload /Llama-2-7b-hf/nf4_batch_size_1_sq_len_256_new_tokens_256/benchmark_report.json with huggingface_hub
Browse files
Llama-2-7b-hf/nf4_batch_size_1_sq_len_256_new_tokens_256/benchmark_report.json
CHANGED
@@ -2,215 +2,215 @@
|
|
2 |
"prefill": {
|
3 |
"memory": {
|
4 |
"unit": "MB",
|
5 |
-
"max_ram":
|
6 |
"max_vram": 4940.890112,
|
7 |
"max_reserved": 4456.448,
|
8 |
"max_allocated": 4286.221824
|
9 |
},
|
10 |
"latency": {
|
11 |
"unit": "s",
|
12 |
-
"mean": 0.
|
13 |
-
"stdev": 0.
|
14 |
"values": [
|
15 |
-
0.
|
16 |
-
0.
|
17 |
-
0.
|
18 |
-
0.
|
19 |
-
0.
|
20 |
-
0.
|
21 |
-
0.
|
22 |
-
0.
|
23 |
-
0.
|
24 |
-
0.
|
25 |
-
0.
|
26 |
-
0.
|
27 |
-
0.
|
28 |
-
0.
|
29 |
-
0.
|
30 |
-
0.053000190734863284,
|
31 |
-
0.05276160049438477,
|
32 |
-
0.05281075286865235,
|
33 |
-
0.053375999450683595,
|
34 |
-
0.051775489807128906,
|
35 |
-
0.05146316909790039,
|
36 |
0.05167513656616211,
|
37 |
-
0.
|
38 |
-
0.
|
39 |
-
0.
|
40 |
-
0.
|
41 |
-
0.
|
42 |
-
0.
|
43 |
-
0.
|
44 |
-
0.
|
45 |
-
0.
|
46 |
-
0.
|
47 |
-
0.
|
48 |
-
0.
|
49 |
-
0.
|
50 |
-
0.
|
51 |
-
0.
|
52 |
-
0.
|
53 |
-
0.
|
54 |
-
0.
|
55 |
-
0.
|
56 |
-
0.
|
57 |
-
0.
|
58 |
-
0.
|
59 |
-
0.
|
60 |
-
0.
|
61 |
-
0.
|
62 |
-
0.
|
63 |
-
0.
|
64 |
-
0.
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
65 |
0.0515676155090332,
|
66 |
-
0.
|
67 |
-
0.
|
68 |
-
0.05165465545654297,
|
69 |
-
0.05150207901000976,
|
70 |
-
0.05151846313476562,
|
71 |
-
0.05116825485229492,
|
72 |
-
0.051286014556884765,
|
73 |
-
0.05153484725952148,
|
74 |
-
0.051636417388916014,
|
75 |
0.05152767944335938,
|
76 |
-
0.
|
77 |
-
0.
|
78 |
-
0.
|
79 |
-
0.
|
80 |
-
0.
|
81 |
-
0.
|
82 |
-
0.
|
83 |
-
0.
|
84 |
-
0.
|
85 |
-
0.
|
86 |
-
0.
|
87 |
-
0.
|
88 |
-
0.
|
89 |
-
0.
|
90 |
-
0.
|
91 |
-
0.
|
92 |
-
0.
|
93 |
-
0.
|
94 |
-
0.
|
95 |
-
0.
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
96 |
0.05161676788330078,
|
97 |
-
0.
|
98 |
-
0.
|
99 |
-
0.
|
100 |
-
0.05110681533813476,
|
101 |
-
0.05103923034667969,
|
102 |
-
0.05158707046508789,
|
103 |
-
0.051504127502441405,
|
104 |
-
0.05152153778076172,
|
105 |
-
0.05145087814331055,
|
106 |
-
0.05159219360351563,
|
107 |
-
0.05135974502563476,
|
108 |
-
0.05164646530151367,
|
109 |
-
0.05147955322265625,
|
110 |
-
0.051542015075683595,
|
111 |
-
0.051353599548339846,
|
112 |
-
0.05110476684570313,
|
113 |
-
0.051089408874511716,
|
114 |
-
0.05126358413696289,
|
115 |
-
0.05118054580688477,
|
116 |
-
0.05140070343017578,
|
117 |
-
0.05142425537109375,
|
118 |
-
0.0513177604675293,
|
119 |
-
0.051113983154296876,
|
120 |
-
0.051154945373535154,
|
121 |
-
0.05133852767944336,
|
122 |
0.05161062240600586,
|
123 |
-
0.
|
124 |
-
0.
|
125 |
-
0.
|
126 |
-
0.
|
127 |
-
0.
|
128 |
-
0.
|
129 |
-
0.
|
130 |
-
0.
|
131 |
-
0.
|
132 |
-
0.
|
133 |
-
0.
|
134 |
-
0.
|
135 |
-
0.
|
136 |
-
0.
|
137 |
-
0.
|
138 |
-
0.
|
139 |
-
0.
|
140 |
-
0.
|
141 |
-
0.
|
142 |
-
0.
|
|
|
|
|
|
|
143 |
0.05175296020507812,
|
144 |
-
0.
|
145 |
-
0.
|
146 |
-
0.
|
147 |
-
0.
|
148 |
-
0.
|
149 |
-
0.
|
150 |
-
0.
|
151 |
-
0.
|
152 |
-
0.05168025588989258,
|
153 |
-
0.051606529235839846,
|
154 |
-
0.05172326278686523,
|
155 |
-
0.051533824920654295,
|
156 |
-
0.0515676155090332,
|
157 |
-
0.0515491828918457,
|
158 |
-
0.0512911376953125,
|
159 |
-
0.051418113708496097,
|
160 |
-
0.05157888031005859,
|
161 |
-
0.0514068489074707,
|
162 |
-
0.051092479705810545,
|
163 |
-
0.05153177642822265,
|
164 |
-
0.051422206878662106,
|
165 |
-
0.051530750274658206,
|
166 |
-
0.05161574554443359,
|
167 |
-
0.05168230438232422,
|
168 |
-
0.051781631469726565,
|
169 |
-
0.051560447692871096,
|
170 |
-
0.051571712493896485,
|
171 |
-
0.051389438629150394,
|
172 |
-
0.0515860481262207,
|
173 |
-
0.051622913360595706,
|
174 |
-
0.05162188720703125,
|
175 |
-
0.05143756866455078,
|
176 |
-
0.051525630950927735,
|
177 |
0.051622913360595706,
|
178 |
-
0.
|
179 |
-
0.
|
180 |
-
0.
|
181 |
-
0.
|
182 |
-
0.
|
183 |
-
0.
|
184 |
-
0.
|
185 |
-
0.
|
186 |
-
0.
|
187 |
-
0.
|
188 |
-
0.
|
189 |
-
0.
|
190 |
-
0.
|
191 |
-
0.
|
192 |
-
0.
|
193 |
-
0.
|
194 |
-
0.
|
195 |
-
0.
|
196 |
-
0.0517314567565918,
|
197 |
-
0.051535873413085936,
|
198 |
-
0.051574783325195314,
|
199 |
-
0.05158195114135742,
|
200 |
-
0.05166592025756836,
|
201 |
-
0.05140787124633789,
|
202 |
-
0.051350528717041016,
|
203 |
-
0.0511539192199707,
|
204 |
-
0.05114470291137695,
|
205 |
-
0.05105049514770508,
|
206 |
-
0.051509246826171876,
|
207 |
-
0.05155350494384765,
|
208 |
-
0.05147347259521484
|
209 |
]
|
210 |
},
|
211 |
"throughput": {
|
212 |
"unit": "tokens/s",
|
213 |
-
"value":
|
214 |
},
|
215 |
"energy": null,
|
216 |
"efficiency": null
|
@@ -218,22 +218,22 @@
|
|
218 |
"decode": {
|
219 |
"memory": {
|
220 |
"unit": "MB",
|
221 |
-
"max_ram":
|
222 |
"max_vram": 5314.183168,
|
223 |
"max_reserved": 4829.741056,
|
224 |
"max_allocated": 4749.821952
|
225 |
},
|
226 |
"latency": {
|
227 |
"unit": "s",
|
228 |
-
"mean": 10.
|
229 |
"stdev": 0,
|
230 |
"values": [
|
231 |
-
10.
|
232 |
]
|
233 |
},
|
234 |
"throughput": {
|
235 |
"unit": "tokens/s",
|
236 |
-
"value":
|
237 |
},
|
238 |
"energy": null,
|
239 |
"efficiency": null
|
@@ -242,269 +242,269 @@
|
|
242 |
"memory": null,
|
243 |
"latency": {
|
244 |
"unit": "s",
|
245 |
-
"mean": 0.
|
246 |
-
"stdev": 0.
|
247 |
"values": [
|
248 |
-
0.
|
249 |
-
0.
|
250 |
-
0.
|
251 |
-
0.
|
252 |
-
0.
|
253 |
-
0.
|
254 |
-
0.
|
255 |
-
0.
|
256 |
-
0.
|
257 |
-
0.
|
258 |
-
0.
|
259 |
-
0.
|
260 |
-
0.
|
261 |
-
0.
|
262 |
-
0.
|
263 |
-
0.
|
264 |
-
0.
|
265 |
-
0.
|
266 |
-
0.
|
267 |
-
0.
|
268 |
-
0.
|
269 |
-
0.
|
270 |
-
0.
|
271 |
-
0.
|
272 |
-
0.
|
273 |
-
0.
|
274 |
-
0.
|
275 |
-
0.
|
276 |
-
0.
|
277 |
-
0.
|
278 |
-
0.
|
279 |
-
0.
|
280 |
-
0.
|
281 |
-
0.
|
|
|
|
|
|
|
|
|
|
|
282 |
0.04153241729736328,
|
283 |
-
0.
|
284 |
-
0.
|
285 |
-
0.
|
286 |
-
0.
|
287 |
-
0.
|
288 |
-
0.
|
289 |
-
0.
|
290 |
-
0.04181708908081055,
|
291 |
-
0.04179267120361328,
|
292 |
-
0.04171260833740234,
|
293 |
-
0.04174937438964844,
|
294 |
-
0.041616382598876955,
|
295 |
-
0.041829376220703124,
|
296 |
-
0.041603073120117184,
|
297 |
-
0.041717758178710936,
|
298 |
-
0.04151500701904297,
|
299 |
-
0.041731071472167966,
|
300 |
0.041608192443847655,
|
301 |
-
0.
|
302 |
-
0.
|
303 |
-
0.
|
304 |
-
0.
|
305 |
-
0.
|
306 |
-
0.
|
307 |
-
0.
|
308 |
-
0.041524223327636715,
|
309 |
-
0.04168601608276367,
|
310 |
-
0.041593120574951174,
|
311 |
-
0.041797344207763674,
|
312 |
-
0.04171571350097656,
|
313 |
-
0.041632766723632815,
|
314 |
-
0.041614334106445314,
|
315 |
-
0.041626625061035157,
|
316 |
-
0.04193689727783203,
|
317 |
-
0.04165017700195312,
|
318 |
-
0.04174028778076172,
|
319 |
-
0.04172403335571289,
|
320 |
-
0.04162547302246094,
|
321 |
-
0.04185712051391602,
|
322 |
-
0.04182316970825195,
|
323 |
-
0.04184675216674805,
|
324 |
-
0.04163481521606445,
|
325 |
-
0.041601184844970704,
|
326 |
-
0.041738079071044924,
|
327 |
-
0.04175475311279297,
|
328 |
-
0.041651073455810546,
|
329 |
-
0.04153753662109375,
|
330 |
-
0.04159590530395508,
|
331 |
-
0.04167782211303711,
|
332 |
-
0.04157132720947266,
|
333 |
-
0.04167081451416016,
|
334 |
-
0.04192240142822266,
|
335 |
-
0.041847808837890625,
|
336 |
-
0.0417781753540039,
|
337 |
-
0.041589759826660154,
|
338 |
-
0.04146380615234375,
|
339 |
0.04161740875244141,
|
340 |
-
0.
|
341 |
-
0.
|
342 |
-
0.
|
343 |
-
0.
|
344 |
-
0.
|
345 |
-
0.
|
346 |
-
0.
|
347 |
-
0.
|
348 |
-
0.
|
349 |
-
0.
|
350 |
-
0.
|
351 |
-
0.
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
352 |
0.04157235336303711,
|
353 |
-
0.
|
354 |
-
0.
|
355 |
-
0.
|
356 |
-
0.
|
357 |
-
0.
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
358 |
0.04149657440185547,
|
359 |
-
0.
|
360 |
-
0.
|
361 |
-
0.
|
362 |
-
0.
|
363 |
-
0.0417465934753418,
|
364 |
-
0.041484127044677736,
|
365 |
-
0.041576446533203124,
|
366 |
-
0.04166451263427735,
|
367 |
-
0.04152012634277344,
|
368 |
-
0.04155084609985352,
|
369 |
-
0.04184796905517578,
|
370 |
-
0.041730110168457034,
|
371 |
-
0.04171241760253906,
|
372 |
-
0.04195942306518555,
|
373 |
-
0.04180086517333984,
|
374 |
-
0.041860958099365235,
|
375 |
-
0.04213862228393555,
|
376 |
-
0.041812992095947264,
|
377 |
-
0.04155295944213867,
|
378 |
-
0.04158047866821289,
|
379 |
-
0.04168601608276367,
|
380 |
-
0.041646080017089845,
|
381 |
-
0.04159414291381836,
|
382 |
-
0.0416734390258789,
|
383 |
-
0.041470977783203126,
|
384 |
-
0.04157440185546875,
|
385 |
-
0.0416993293762207,
|
386 |
-
0.041603073120117184,
|
387 |
-
0.04145459365844727,
|
388 |
-
0.04195840072631836,
|
389 |
-
0.04162169647216797,
|
390 |
-
0.04170630264282227,
|
391 |
-
0.041556991577148435,
|
392 |
-
0.04160102462768555,
|
393 |
-
0.04152115249633789,
|
394 |
-
0.0416071662902832,
|
395 |
-
0.041560062408447264,
|
396 |
-
0.04177519989013672,
|
397 |
-
0.041548702239990236,
|
398 |
-
0.04153958511352539,
|
399 |
-
0.04204851150512695,
|
400 |
-
0.041673728942871094,
|
401 |
-
0.04154163360595703,
|
402 |
0.04151398468017578,
|
403 |
-
0.
|
404 |
-
0.
|
405 |
-
0.
|
406 |
-
0.
|
407 |
-
0.04147711944580078,
|
408 |
-
0.04153958511352539,
|
409 |
-
0.041490432739257815,
|
410 |
-
0.0418600959777832,
|
411 |
-
0.04146995162963867,
|
412 |
-
0.04177519989013672,
|
413 |
-
0.04163593673706055,
|
414 |
-
0.04164281463623047,
|
415 |
-
0.04151603317260742,
|
416 |
-
0.04149350357055664,
|
417 |
-
0.04160102462768555,
|
418 |
-
0.04163481521606445,
|
419 |
-
0.042264575958251956,
|
420 |
-
0.041559040069580076,
|
421 |
-
0.041662689208984374,
|
422 |
-
0.04177590560913086,
|
423 |
0.04161740875244141,
|
|
|
|
|
|
|
|
|
|
|
424 |
0.04158156967163086,
|
425 |
-
0.
|
426 |
-
0.
|
427 |
-
0.
|
428 |
-
0.
|
429 |
-
0.
|
430 |
-
0.
|
431 |
-
0.
|
432 |
-
0.
|
433 |
-
0.
|
434 |
-
0.
|
435 |
-
0.
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
436 |
0.04147609710693359,
|
437 |
-
0.
|
438 |
-
0.
|
439 |
-
0.
|
440 |
-
0.
|
441 |
-
0.
|
442 |
-
0.04158153533935547,
|
443 |
-
0.042003456115722655,
|
444 |
-
0.0416861457824707,
|
445 |
-
0.04159183883666992,
|
446 |
-
0.041616222381591794,
|
447 |
-
0.04163993453979492,
|
448 |
-
0.04178432083129883,
|
449 |
-
0.04165119934082031,
|
450 |
-
0.0417628173828125,
|
451 |
-
0.041796607971191405,
|
452 |
-
0.04151603317260742,
|
453 |
-
0.041546817779541015,
|
454 |
-
0.04167776107788086,
|
455 |
-
0.04168601608276367,
|
456 |
-
0.041657344818115234,
|
457 |
-
0.0416923828125,
|
458 |
-
0.04163459014892578,
|
459 |
-
0.04161536026000977,
|
460 |
-
0.041619457244873044,
|
461 |
-
0.04166057586669922,
|
462 |
-
0.041583454132080075,
|
463 |
-
0.042014720916748044,
|
464 |
-
0.041640960693359375,
|
465 |
-
0.041836544036865236,
|
466 |
-
0.04171571350097656,
|
467 |
-
0.041724929809570314,
|
468 |
-
0.04170137786865234,
|
469 |
-
0.041708545684814455,
|
470 |
-
0.04186521530151367,
|
471 |
-
0.041589759826660154,
|
472 |
-
0.0416102409362793,
|
473 |
-
0.04151295852661133,
|
474 |
-
0.041506816864013675,
|
475 |
-
0.04159897613525391,
|
476 |
-
0.04149657440185547,
|
477 |
-
0.04168499374389648,
|
478 |
-
0.041540607452392575,
|
479 |
-
0.04151603317260742,
|
480 |
-
0.041826305389404295,
|
481 |
-
0.041657344818115234,
|
482 |
-
0.0416102409362793,
|
483 |
0.04163993453979492,
|
484 |
-
0.
|
485 |
-
0.
|
486 |
-
0.
|
487 |
-
0.
|
488 |
-
0.
|
489 |
-
0.
|
490 |
-
0.
|
491 |
-
0.
|
492 |
-
0.
|
493 |
-
0.
|
494 |
-
0.
|
495 |
-
0.
|
496 |
-
0.
|
497 |
-
0.
|
498 |
-
0.
|
499 |
-
0.
|
500 |
-
0.
|
501 |
-
0.
|
502 |
-
0.
|
|
|
|
|
|
|
503 |
]
|
504 |
},
|
505 |
"throughput": {
|
506 |
"unit": "tokens/s",
|
507 |
-
"value":
|
508 |
},
|
509 |
"energy": null,
|
510 |
"efficiency": null
|
|
|
2 |
"prefill": {
|
3 |
"memory": {
|
4 |
"unit": "MB",
|
5 |
+
"max_ram": 1028.804608,
|
6 |
"max_vram": 4940.890112,
|
7 |
"max_reserved": 4456.448,
|
8 |
"max_allocated": 4286.221824
|
9 |
},
|
10 |
"latency": {
|
11 |
"unit": "s",
|
12 |
+
"mean": 0.05170404202176124,
|
13 |
+
"stdev": 0.0002913311874566411,
|
14 |
"values": [
|
15 |
+
0.05474662399291992,
|
16 |
+
0.05249331283569336,
|
17 |
+
0.0521082878112793,
|
18 |
+
0.05223238372802735,
|
19 |
+
0.05216255950927735,
|
20 |
+
0.05239807891845703,
|
21 |
+
0.052034561157226565,
|
22 |
+
0.05223628616333008,
|
23 |
+
0.052259838104248044,
|
24 |
+
0.05230182266235352,
|
25 |
+
0.0523059196472168,
|
26 |
+
0.0518809585571289,
|
27 |
+
0.05163315200805664,
|
28 |
+
0.05170687866210937,
|
29 |
+
0.05161574554443359,
|
|
|
|
|
|
|
|
|
|
|
|
|
30 |
0.05167513656616211,
|
31 |
+
0.05212979125976563,
|
32 |
+
0.05194342422485351,
|
33 |
+
0.05171712112426758,
|
34 |
+
0.05173657608032227,
|
35 |
+
0.05156777572631836,
|
36 |
+
0.0516640625,
|
37 |
+
0.051748863220214845,
|
38 |
+
0.05178879928588867,
|
39 |
+
0.05161062240600586,
|
40 |
+
0.05174272155761719,
|
41 |
+
0.05163113784790039,
|
42 |
+
0.05164748764038086,
|
43 |
+
0.05156454467773437,
|
44 |
+
0.05157791900634766,
|
45 |
+
0.05141708755493164,
|
46 |
+
0.051490943908691404,
|
47 |
+
0.05137100982666016,
|
48 |
+
0.0516864013671875,
|
49 |
+
0.05160243225097656,
|
50 |
+
0.051738624572753904,
|
51 |
+
0.051999744415283204,
|
52 |
+
0.051783679962158206,
|
53 |
+
0.051481601715087894,
|
54 |
+
0.05161062240600586,
|
55 |
+
0.051520511627197264,
|
56 |
+
0.05166592025756836,
|
57 |
+
0.051547134399414066,
|
58 |
+
0.05160857772827149,
|
59 |
+
0.0514785270690918,
|
60 |
+
0.05148672103881836,
|
61 |
+
0.05153177642822265,
|
62 |
+
0.05165055847167969,
|
63 |
+
0.05150515365600586,
|
64 |
+
0.05148876953125,
|
65 |
+
0.05164569473266602,
|
66 |
+
0.05170278549194336,
|
67 |
+
0.051604480743408204,
|
68 |
+
0.05159833526611328,
|
69 |
+
0.051568641662597656,
|
70 |
+
0.05163417434692383,
|
71 |
+
0.05162598419189453,
|
72 |
+
0.05165363311767578,
|
73 |
+
0.05160243225097656,
|
74 |
+
0.05159628677368164,
|
75 |
+
0.052029441833496094,
|
76 |
+
0.05173350524902344,
|
77 |
+
0.05187686538696289,
|
78 |
+
0.05168844985961914,
|
79 |
+
0.05183590316772461,
|
80 |
+
0.051697696685791016,
|
81 |
+
0.051716094970703126,
|
82 |
+
0.05158092880249023,
|
83 |
+
0.05147750473022461,
|
84 |
+
0.051664894104003906,
|
85 |
+
0.05157580947875977,
|
86 |
+
0.05148876953125,
|
87 |
+
0.051485889434814455,
|
88 |
+
0.051588096618652345,
|
89 |
0.0515676155090332,
|
90 |
+
0.05146419143676758,
|
91 |
+
0.05151641464233398,
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
92 |
0.05152767944335938,
|
93 |
+
0.05159833526611328,
|
94 |
+
0.051465217590332034,
|
95 |
+
0.05142015838623047,
|
96 |
+
0.05143756866455078,
|
97 |
+
0.05128396987915039,
|
98 |
+
0.051454975128173826,
|
99 |
+
0.05168230438232422,
|
100 |
+
0.05155635070800781,
|
101 |
+
0.05148672103881836,
|
102 |
+
0.051555328369140625,
|
103 |
+
0.051607551574707033,
|
104 |
+
0.05154816055297851,
|
105 |
+
0.051509246826171876,
|
106 |
+
0.05170995330810547,
|
107 |
+
0.05150822448730469,
|
108 |
+
0.05158399963378906,
|
109 |
+
0.05162396621704102,
|
110 |
+
0.05163417434692383,
|
111 |
+
0.051630271911621096,
|
112 |
+
0.051637248992919924,
|
113 |
+
0.051507198333740234,
|
114 |
+
0.05139251327514648,
|
115 |
+
0.05223427200317383,
|
116 |
+
0.05161164855957031,
|
117 |
+
0.05165670394897461,
|
118 |
+
0.05176627349853516,
|
119 |
+
0.05170687866210937,
|
120 |
+
0.051694591522216796,
|
121 |
+
0.051681278228759765,
|
122 |
+
0.05163827133178711,
|
123 |
+
0.05157785415649414,
|
124 |
+
0.05177446365356445,
|
125 |
+
0.051590335845947265,
|
126 |
+
0.05158399963378906,
|
127 |
+
0.051609790802001954,
|
128 |
+
0.05170380783081055,
|
129 |
+
0.05162496185302735,
|
130 |
+
0.05159430313110352,
|
131 |
+
0.05165167999267578,
|
132 |
+
0.051708927154541014,
|
133 |
+
0.05170073699951172,
|
134 |
+
0.05180108642578125,
|
135 |
+
0.05187801742553711,
|
136 |
+
0.05182160186767578,
|
137 |
+
0.051748863220214845,
|
138 |
+
0.051789825439453124,
|
139 |
+
0.05173350524902344,
|
140 |
+
0.051783679962158206,
|
141 |
+
0.05178060913085938,
|
142 |
+
0.051724288940429686,
|
143 |
+
0.05212876892089844,
|
144 |
+
0.05194342422485351,
|
145 |
+
0.0517918701171875,
|
146 |
+
0.05176934432983398,
|
147 |
+
0.051751937866210934,
|
148 |
+
0.05177241516113281,
|
149 |
+
0.05167411041259766,
|
150 |
+
0.05182668685913086,
|
151 |
+
0.05158195114135742,
|
152 |
+
0.05170393753051758,
|
153 |
0.05161676788330078,
|
154 |
+
0.05174272155761719,
|
155 |
+
0.051664894104003906,
|
156 |
+
0.051720352172851564,
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
157 |
0.05161062240600586,
|
158 |
+
0.051676319122314456,
|
159 |
+
0.051555328369140625,
|
160 |
+
0.05170483016967774,
|
161 |
+
0.05160243225097656,
|
162 |
+
0.05161676788330078,
|
163 |
+
0.05199359893798828,
|
164 |
+
0.05179904174804688,
|
165 |
+
0.05155430221557617,
|
166 |
+
0.05167718505859375,
|
167 |
+
0.05153792190551758,
|
168 |
+
0.05167513656616211,
|
169 |
+
0.05177967834472656,
|
170 |
+
0.0518043212890625,
|
171 |
+
0.051678207397460936,
|
172 |
+
0.05164134216308594,
|
173 |
+
0.051716094970703126,
|
174 |
+
0.051778560638427736,
|
175 |
+
0.051678207397460936,
|
176 |
+
0.05180006408691406,
|
177 |
+
0.05164543914794922,
|
178 |
+
0.051699710845947267,
|
179 |
+
0.05167718505859375,
|
180 |
+
0.051492862701416016,
|
181 |
0.05175296020507812,
|
182 |
+
0.05163417434692383,
|
183 |
+
0.051490814208984374,
|
184 |
+
0.05177958297729492,
|
185 |
+
0.051591167449951174,
|
186 |
+
0.05171712112426758,
|
187 |
+
0.05205811309814453,
|
188 |
+
0.05183590316772461,
|
189 |
+
0.05155942535400391,
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
190 |
0.051622913360595706,
|
191 |
+
0.05161881637573242,
|
192 |
+
0.05156249618530274,
|
193 |
+
0.051490814208984374,
|
194 |
+
0.05158707046508789,
|
195 |
+
0.05153996658325195,
|
196 |
+
0.05140582275390625,
|
197 |
+
0.05149798583984375,
|
198 |
+
0.051627006530761715,
|
199 |
+
0.05169356918334961,
|
200 |
+
0.05175603103637695,
|
201 |
+
0.05152767944335938,
|
202 |
+
0.05167923355102539,
|
203 |
+
0.05166694259643555,
|
204 |
+
0.05178777694702148,
|
205 |
+
0.05167923355102539,
|
206 |
+
0.05167103958129883,
|
207 |
+
0.05163827133178711,
|
208 |
+
0.051745792388916016
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
209 |
]
|
210 |
},
|
211 |
"throughput": {
|
212 |
"unit": "tokens/s",
|
213 |
+
"value": 4951.257000221656
|
214 |
},
|
215 |
"energy": null,
|
216 |
"efficiency": null
|
|
|
218 |
"decode": {
|
219 |
"memory": {
|
220 |
"unit": "MB",
|
221 |
+
"max_ram": 1049.776128,
|
222 |
"max_vram": 5314.183168,
|
223 |
"max_reserved": 4829.741056,
|
224 |
"max_allocated": 4749.821952
|
225 |
},
|
226 |
"latency": {
|
227 |
"unit": "s",
|
228 |
+
"mean": 10.574656513214116,
|
229 |
"stdev": 0,
|
230 |
"values": [
|
231 |
+
10.574656513214116
|
232 |
]
|
233 |
},
|
234 |
"throughput": {
|
235 |
"unit": "tokens/s",
|
236 |
+
"value": 24.114258433014008
|
237 |
},
|
238 |
"energy": null,
|
239 |
"efficiency": null
|
|
|
242 |
"memory": null,
|
243 |
"latency": {
|
244 |
"unit": "s",
|
245 |
+
"mean": 0.04146924122829065,
|
246 |
+
"stdev": 0.00017074772409957268,
|
247 |
"values": [
|
248 |
+
0.04150476837158203,
|
249 |
+
0.042403839111328126,
|
250 |
+
0.041670654296875,
|
251 |
+
0.041546817779541015,
|
252 |
+
0.041508800506591795,
|
253 |
+
0.042191871643066405,
|
254 |
+
0.041529342651367186,
|
255 |
+
0.041586688995361325,
|
256 |
+
0.041390079498291016,
|
257 |
+
0.041543678283691404,
|
258 |
+
0.04146790313720703,
|
259 |
+
0.04157132720947266,
|
260 |
+
0.04135321426391601,
|
261 |
+
0.04207820892333984,
|
262 |
+
0.0416255989074707,
|
263 |
+
0.04173721694946289,
|
264 |
+
0.041444351196289066,
|
265 |
+
0.041559040069580076,
|
266 |
+
0.041573375701904294,
|
267 |
+
0.041681919097900394,
|
268 |
+
0.04148428726196289,
|
269 |
+
0.04157440185546875,
|
270 |
+
0.041488384246826174,
|
271 |
+
0.041543678283691404,
|
272 |
+
0.041390079498291016,
|
273 |
+
0.041570335388183596,
|
274 |
+
0.04142076873779297,
|
275 |
+
0.041436161041259766,
|
276 |
+
0.04136140823364258,
|
277 |
+
0.04148735809326172,
|
278 |
+
0.041488384246826174,
|
279 |
+
0.04146278381347656,
|
280 |
+
0.041289726257324216,
|
281 |
+
0.041427967071533206,
|
282 |
+
0.04124671936035156,
|
283 |
+
0.041312255859375,
|
284 |
+
0.04126310348510742,
|
285 |
+
0.04131532669067383,
|
286 |
+
0.041750526428222655,
|
287 |
0.04153241729736328,
|
288 |
+
0.04132556915283203,
|
289 |
+
0.04212736129760742,
|
290 |
+
0.041588737487792966,
|
291 |
+
0.04150067138671875,
|
292 |
+
0.04154777526855469,
|
293 |
+
0.041559040069580076,
|
294 |
+
0.041442302703857424,
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
295 |
0.041608192443847655,
|
296 |
+
0.04143513488769531,
|
297 |
+
0.04149760055541992,
|
298 |
+
0.04132044982910156,
|
299 |
+
0.0413941764831543,
|
300 |
+
0.04140544128417969,
|
301 |
+
0.04152012634277344,
|
302 |
+
0.041414657592773435,
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
303 |
0.04161740875244141,
|
304 |
+
0.04153036880493164,
|
305 |
+
0.041518081665039064,
|
306 |
+
0.04139212799072266,
|
307 |
+
0.04147507095336914,
|
308 |
+
0.04136243057250977,
|
309 |
+
0.041524223327636715,
|
310 |
+
0.04139622497558594,
|
311 |
+
0.04150374221801758,
|
312 |
+
0.04150067138671875,
|
313 |
+
0.04148633575439453,
|
314 |
+
0.04196147155761719,
|
315 |
+
0.041635841369628904,
|
316 |
+
0.04150476837158203,
|
317 |
+
0.04139519882202149,
|
318 |
+
0.04140544128417969,
|
319 |
+
0.041545726776123046,
|
320 |
+
0.04131020736694336,
|
321 |
+
0.04139622497558594,
|
322 |
+
0.041296897888183595,
|
323 |
+
0.041404415130615234,
|
324 |
+
0.04141484832763672,
|
325 |
+
0.041215808868408206,
|
326 |
+
0.04135116958618164,
|
327 |
+
0.04145459365844727,
|
328 |
+
0.0414832649230957,
|
329 |
0.04157235336303711,
|
330 |
+
0.041534465789794923,
|
331 |
+
0.04132863998413086,
|
332 |
+
0.04141875076293945,
|
333 |
+
0.04150067138671875,
|
334 |
+
0.04132761764526367,
|
335 |
+
0.04156927871704102,
|
336 |
+
0.04131123352050781,
|
337 |
+
0.04123648071289063,
|
338 |
+
0.04149862289428711,
|
339 |
+
0.04136243057250977,
|
340 |
+
0.04140544128417969,
|
341 |
+
0.042194942474365234,
|
342 |
+
0.04163891220092773,
|
343 |
+
0.04163071823120117,
|
344 |
+
0.04144537734985351,
|
345 |
+
0.041460735321044925,
|
346 |
+
0.04140544128417969,
|
347 |
0.04149657440185547,
|
348 |
+
0.041442302703857424,
|
349 |
+
0.04144537734985351,
|
350 |
+
0.04136959838867187,
|
351 |
+
0.0414730224609375,
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
352 |
0.04151398468017578,
|
353 |
+
0.04151500701904297,
|
354 |
+
0.041534465789794923,
|
355 |
+
0.041384960174560545,
|
356 |
+
0.04180275344848633,
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
357 |
0.04161740875244141,
|
358 |
+
0.04157132720947266,
|
359 |
+
0.04156108856201172,
|
360 |
+
0.04146278381347656,
|
361 |
+
0.04144844818115234,
|
362 |
+
0.041681919097900394,
|
363 |
0.04158156967163086,
|
364 |
+
0.04139519882202149,
|
365 |
+
0.04136345672607422,
|
366 |
+
0.04143308639526367,
|
367 |
+
0.04142489624023438,
|
368 |
+
0.04138086318969727,
|
369 |
+
0.04141875076293945,
|
370 |
+
0.041414657592773435,
|
371 |
+
0.04136243057250977,
|
372 |
+
0.04142489624023438,
|
373 |
+
0.04132966232299805,
|
374 |
+
0.041417728424072264,
|
375 |
+
0.04213248062133789,
|
376 |
+
0.04153958511352539,
|
377 |
+
0.04153958511352539,
|
378 |
+
0.04146380615234375,
|
379 |
+
0.04155289459228516,
|
380 |
+
0.04136447906494141,
|
381 |
+
0.04137267303466797,
|
382 |
+
0.041371646881103515,
|
383 |
+
0.041490432739257815,
|
384 |
+
0.04129587173461914,
|
385 |
+
0.04142694473266602,
|
386 |
+
0.04146176147460937,
|
387 |
+
0.04146380615234375,
|
388 |
+
0.04147507095336914,
|
389 |
+
0.04144332885742188,
|
390 |
+
0.041468929290771485,
|
391 |
+
0.04137472152709961,
|
392 |
+
0.04138905715942383,
|
393 |
+
0.04131123352050781,
|
394 |
+
0.04135833740234375,
|
395 |
+
0.041316352844238284,
|
396 |
+
0.04177510452270508,
|
397 |
+
0.04144537734985351,
|
398 |
+
0.04154163360595703,
|
399 |
+
0.04183552169799805,
|
400 |
+
0.04143001556396484,
|
401 |
+
0.041417728424072264,
|
402 |
+
0.04133171081542969,
|
403 |
+
0.0414648323059082,
|
404 |
+
0.0415098876953125,
|
405 |
+
0.04138086318969727,
|
406 |
+
0.041474048614501956,
|
407 |
+
0.041289726257324216,
|
408 |
+
0.041376766204833985,
|
409 |
+
0.04139724731445313,
|
410 |
+
0.04148019027709961,
|
411 |
+
0.04131532669067383,
|
412 |
+
0.04135935974121094,
|
413 |
+
0.04131020736694336,
|
414 |
+
0.04136345672607422,
|
415 |
+
0.04132044982910156,
|
416 |
+
0.04127129745483398,
|
417 |
+
0.04123648071289063,
|
418 |
+
0.041319423675537106,
|
419 |
+
0.042106880187988284,
|
420 |
+
0.041452545166015625,
|
421 |
+
0.04160409545898437,
|
422 |
+
0.0414463996887207,
|
423 |
+
0.041425918579101564,
|
424 |
+
0.04141363143920898,
|
425 |
+
0.041594879150390625,
|
426 |
+
0.041491455078125,
|
427 |
+
0.04127231979370117,
|
428 |
+
0.04136447906494141,
|
429 |
+
0.0414730224609375,
|
430 |
+
0.04146278381347656,
|
431 |
+
0.04133171081542969,
|
432 |
+
0.041278465270996094,
|
433 |
+
0.04126924896240235,
|
434 |
+
0.041398273468017575,
|
435 |
+
0.04142489624023438,
|
436 |
+
0.041355262756347655,
|
437 |
+
0.04139519882202149,
|
438 |
+
0.041470977783203126,
|
439 |
+
0.04130201721191406,
|
440 |
+
0.0414648323059082,
|
441 |
+
0.04188774490356445,
|
442 |
+
0.04142899322509765,
|
443 |
+
0.04134400177001953,
|
444 |
+
0.04126617431640625,
|
445 |
+
0.04130099105834961,
|
446 |
+
0.0413829116821289,
|
447 |
+
0.04145151901245117,
|
448 |
+
0.04148223876953125,
|
449 |
+
0.04157030487060547,
|
450 |
+
0.04130713653564453,
|
451 |
+
0.04139929580688476,
|
452 |
+
0.04117913436889648,
|
453 |
+
0.04145459365844727,
|
454 |
+
0.04136959838867187,
|
455 |
+
0.041431041717529295,
|
456 |
+
0.04142489624023438,
|
457 |
+
0.041336830139160154,
|
458 |
+
0.041388031005859374,
|
459 |
+
0.04127231979370117,
|
460 |
+
0.04135116958618164,
|
461 |
+
0.04148121643066406,
|
462 |
+
0.04142182540893555,
|
463 |
+
0.04147814559936523,
|
464 |
+
0.04150067138671875,
|
465 |
+
0.04145459365844727,
|
466 |
+
0.041457664489746096,
|
467 |
+
0.04138393783569336,
|
468 |
+
0.04140031814575195,
|
469 |
+
0.042016769409179686,
|
470 |
+
0.0415549430847168,
|
471 |
+
0.04157440185546875,
|
472 |
+
0.04136038589477539,
|
473 |
+
0.04165529632568359,
|
474 |
0.04147609710693359,
|
475 |
+
0.041447425842285154,
|
476 |
+
0.04145459365844727,
|
477 |
+
0.041441280364990236,
|
478 |
+
0.04125286483764649,
|
479 |
+
0.04126617431640625,
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
480 |
0.04163993453979492,
|
481 |
+
0.041490432739257815,
|
482 |
+
0.04153139114379883,
|
483 |
+
0.04145663833618164,
|
484 |
+
0.04133375930786133,
|
485 |
+
0.04145663833618164,
|
486 |
+
0.04137062454223633,
|
487 |
+
0.04146176147460937,
|
488 |
+
0.04140544128417969,
|
489 |
+
0.04143513488769531,
|
490 |
+
0.041425918579101564,
|
491 |
+
0.041306110382080076,
|
492 |
+
0.041417728424072264,
|
493 |
+
0.041401344299316405,
|
494 |
+
0.04133785629272461,
|
495 |
+
0.041524223327636715,
|
496 |
+
0.04125798416137695,
|
497 |
+
0.041411582946777346,
|
498 |
+
0.04127743911743164,
|
499 |
+
0.04143206405639648,
|
500 |
+
0.04170342254638672,
|
501 |
+
0.04133375930786133,
|
502 |
+
0.04138393783569336
|
503 |
]
|
504 |
},
|
505 |
"throughput": {
|
506 |
"unit": "tokens/s",
|
507 |
+
"value": 24.114258433014008
|
508 |
},
|
509 |
"energy": null,
|
510 |
"efficiency": null
|