kreas commited on
Commit
0282f24
1 Parent(s): de95916

Upload /Llama-2-7b-hf/fp16_batch_size_1_sq_len_256_new_tokens_256/benchmark_report.json with huggingface_hub

Browse files
Llama-2-7b-hf/fp16_batch_size_1_sq_len_256_new_tokens_256/benchmark_report.json ADDED
@@ -0,0 +1,319 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "prefill": {
3
+ "memory": {
4
+ "unit": "MB",
5
+ "max_ram": 14428.340224,
6
+ "max_vram": null,
7
+ "max_reserved": null,
8
+ "max_allocated": null
9
+ },
10
+ "latency": {
11
+ "unit": "s",
12
+ "mean": 721.865740631707,
13
+ "stdev": 0,
14
+ "values": [
15
+ 721.865740631707
16
+ ]
17
+ },
18
+ "throughput": {
19
+ "unit": "tokens/s",
20
+ "value": 0.3546365834953929
21
+ },
22
+ "energy": null,
23
+ "efficiency": null
24
+ },
25
+ "decode": {
26
+ "memory": {
27
+ "unit": "MB",
28
+ "max_ram": 15008.575488,
29
+ "max_vram": null,
30
+ "max_reserved": null,
31
+ "max_allocated": null
32
+ },
33
+ "latency": {
34
+ "unit": "s",
35
+ "mean": 734.3304695356637,
36
+ "stdev": 0,
37
+ "values": [
38
+ 734.3304695356637
39
+ ]
40
+ },
41
+ "throughput": {
42
+ "unit": "tokens/s",
43
+ "value": 0.34725509913982344
44
+ },
45
+ "energy": null,
46
+ "efficiency": null
47
+ },
48
+ "per_token": {
49
+ "memory": null,
50
+ "latency": {
51
+ "unit": "s",
52
+ "mean": 2.879727331512407,
53
+ "stdev": 0.04107362200585789,
54
+ "values": [
55
+ 2.9385468643158674,
56
+ 2.9143700106069446,
57
+ 2.843031763099134,
58
+ 2.822499616071582,
59
+ 2.8212424432858825,
60
+ 2.8061846420168877,
61
+ 2.82673567160964,
62
+ 2.817688633687794,
63
+ 2.8218574644997716,
64
+ 2.8257429832592607,
65
+ 2.8300879187881947,
66
+ 2.8612214317545295,
67
+ 2.829491440206766,
68
+ 2.846251167356968,
69
+ 2.8254850264638662,
70
+ 2.8359292401000857,
71
+ 2.8186050839722157,
72
+ 2.818417158909142,
73
+ 2.828051752410829,
74
+ 2.8666542265564203,
75
+ 2.8268470177426934,
76
+ 2.839160805568099,
77
+ 2.8177184406667948,
78
+ 2.8367137350142,
79
+ 2.8362368857488036,
80
+ 2.8165336698293686,
81
+ 2.842088329605758,
82
+ 2.8467939561232924,
83
+ 2.841556423343718,
84
+ 2.8277707025408745,
85
+ 2.8284124936908484,
86
+ 2.8474630704149604,
87
+ 2.857991522178054,
88
+ 2.835691520012915,
89
+ 2.854499421082437,
90
+ 2.8340786742046475,
91
+ 2.836664179340005,
92
+ 2.824924842454493,
93
+ 2.8405343275517225,
94
+ 2.8246167171746492,
95
+ 2.842505213804543,
96
+ 2.8432223042473197,
97
+ 2.8442600509151816,
98
+ 2.8238972732797265,
99
+ 2.860867719165981,
100
+ 2.8718524603173137,
101
+ 2.8733268408104777,
102
+ 2.836213171482086,
103
+ 2.856795210391283,
104
+ 2.8363574109971523,
105
+ 2.8353463020175695,
106
+ 2.85314810462296,
107
+ 2.835397214628756,
108
+ 2.8340443912893534,
109
+ 2.862760554999113,
110
+ 2.895379811525345,
111
+ 2.82875822391361,
112
+ 2.8349446933716536,
113
+ 2.8385312892496586,
114
+ 2.833289047703147,
115
+ 2.8392162285745144,
116
+ 2.839728854596615,
117
+ 2.8417117930948734,
118
+ 2.835888074710965,
119
+ 2.8375091338530183,
120
+ 2.834161284379661,
121
+ 2.8324432419613004,
122
+ 2.842374537140131,
123
+ 2.8284934889525175,
124
+ 2.835274930112064,
125
+ 2.8297918746247888,
126
+ 2.829239242710173,
127
+ 2.8231541300192475,
128
+ 2.8253626748919487,
129
+ 2.824960014782846,
130
+ 2.8855868177488446,
131
+ 2.9172188816592097,
132
+ 2.8618392841890454,
133
+ 2.8641830645501614,
134
+ 2.8437582114711404,
135
+ 2.8409676663577557,
136
+ 2.8402419853955507,
137
+ 2.8413416389375925,
138
+ 2.8751571010798216,
139
+ 2.8406030628830194,
140
+ 2.849424152635038,
141
+ 2.8573353057727218,
142
+ 2.8517128182575107,
143
+ 2.864315642043948,
144
+ 2.8824369478970766,
145
+ 2.89484746940434,
146
+ 2.8697338197380304,
147
+ 2.9378398340195417,
148
+ 2.9669651770964265,
149
+ 2.9125292915850878,
150
+ 2.8827766915783286,
151
+ 2.919279803521931,
152
+ 2.925505558028817,
153
+ 2.971466583199799,
154
+ 2.976382707245648,
155
+ 2.9475440494716167,
156
+ 2.9559828294441104,
157
+ 2.9283662689849734,
158
+ 2.957946610637009,
159
+ 2.9487025309354067,
160
+ 2.9593161530792713,
161
+ 2.9574743369594216,
162
+ 2.9551591286435723,
163
+ 2.9535121098160744,
164
+ 2.9389448668807745,
165
+ 2.934167162515223,
166
+ 2.8967571863904595,
167
+ 2.8870894983410835,
168
+ 2.8904988281428814,
169
+ 2.8709027180448174,
170
+ 2.8767099333927035,
171
+ 2.8932711351662874,
172
+ 2.9428761349990964,
173
+ 2.928292591124773,
174
+ 2.8747380282729864,
175
+ 2.9095580661669374,
176
+ 2.956421473994851,
177
+ 2.94635031465441,
178
+ 2.9455188224092126,
179
+ 2.9553074492141604,
180
+ 2.8932162523269653,
181
+ 2.8948449539020658,
182
+ 2.9312765803188086,
183
+ 2.957497867755592,
184
+ 2.9412788785994053,
185
+ 2.92288317438215,
186
+ 2.90363381896168,
187
+ 2.9121988248080015,
188
+ 2.9443688839673996,
189
+ 2.92967183701694,
190
+ 2.9383257618173957,
191
+ 2.936237631365657,
192
+ 2.9386482974514365,
193
+ 2.866082170046866,
194
+ 2.9549760092049837,
195
+ 2.9382486511021852,
196
+ 2.9393330961465836,
197
+ 2.9096426740288734,
198
+ 2.9020523242652416,
199
+ 2.8764873230829835,
200
+ 2.866682286374271,
201
+ 2.8484197529032826,
202
+ 2.876657772809267,
203
+ 2.8896455531939864,
204
+ 2.8590773958712816,
205
+ 2.8490395583212376,
206
+ 2.851007671095431,
207
+ 2.8585843229666352,
208
+ 2.9355735015124083,
209
+ 2.8678584871813655,
210
+ 2.8540887301787734,
211
+ 2.862025871872902,
212
+ 2.864875106140971,
213
+ 2.8861198937520385,
214
+ 2.868556930683553,
215
+ 2.8809032710269094,
216
+ 2.892993056215346,
217
+ 2.876742821186781,
218
+ 2.8865705197677016,
219
+ 2.87214616779238,
220
+ 2.8668526308611035,
221
+ 2.8589779138565063,
222
+ 2.865345064550638,
223
+ 2.864395532757044,
224
+ 2.88478621840477,
225
+ 2.87119064014405,
226
+ 2.8600213192403316,
227
+ 2.8527998933568597,
228
+ 2.8860297724604607,
229
+ 2.886469369754195,
230
+ 2.893052900210023,
231
+ 2.910357383079827,
232
+ 2.9132279176265,
233
+ 2.8915587989613414,
234
+ 2.9142491733655334,
235
+ 2.918264406733215,
236
+ 2.8752056267112494,
237
+ 2.8923414312303066,
238
+ 2.879175373353064,
239
+ 2.897947857156396,
240
+ 2.878804001957178,
241
+ 2.877884665504098,
242
+ 2.8997547142207623,
243
+ 2.8672706820070744,
244
+ 2.8854733603075147,
245
+ 2.899583948776126,
246
+ 2.8933304008096457,
247
+ 2.9642009381204844,
248
+ 2.9584755459800363,
249
+ 2.958104996010661,
250
+ 2.8852866739034653,
251
+ 2.9612151719629765,
252
+ 2.933073801919818,
253
+ 2.905569947324693,
254
+ 2.895676862448454,
255
+ 2.965002312324941,
256
+ 2.897310052998364,
257
+ 2.894599227234721,
258
+ 2.876689209602773,
259
+ 2.8785693757236004,
260
+ 2.8887558514252305,
261
+ 2.9644072875380516,
262
+ 2.957297394052148,
263
+ 2.9762211414054036,
264
+ 2.9696932984516025,
265
+ 2.89720113016665,
266
+ 2.870763665996492,
267
+ 2.859030299820006,
268
+ 2.873627556487918,
269
+ 2.888411758467555,
270
+ 2.875111444853246,
271
+ 2.869182980619371,
272
+ 2.855742915533483,
273
+ 2.8318322375416756,
274
+ 2.85879014339298,
275
+ 2.8607146330177784,
276
+ 2.8892394937574863,
277
+ 2.889393324032426,
278
+ 2.8640042385086417,
279
+ 2.864895386621356,
280
+ 2.881627912633121,
281
+ 2.8623299077153206,
282
+ 2.870918257161975,
283
+ 2.8800062220543623,
284
+ 2.8896107506006956,
285
+ 2.8806260097771883,
286
+ 2.8907636739313602,
287
+ 2.8802124094218016,
288
+ 2.9000131618231535,
289
+ 2.8791921930387616,
290
+ 2.879103073850274,
291
+ 2.863607711158693,
292
+ 2.8859146125614643,
293
+ 2.8826688900589943,
294
+ 2.883101955987513,
295
+ 2.8818365577608347,
296
+ 2.9110373854637146,
297
+ 2.900406298227608,
298
+ 2.9013486057519913,
299
+ 2.8826871812343597,
300
+ 2.9449511794373393,
301
+ 2.8626034427434206,
302
+ 2.8796125492081046,
303
+ 2.8574486561119556,
304
+ 2.8672727392986417,
305
+ 2.8586518662050366,
306
+ 2.866157935000956,
307
+ 2.8607459645718336,
308
+ 2.8829027032479644,
309
+ 2.8827389432117343
310
+ ]
311
+ },
312
+ "throughput": {
313
+ "unit": "tokens/s",
314
+ "value": 0.34725509913982344
315
+ },
316
+ "energy": null,
317
+ "efficiency": null
318
+ }
319
+ }