framework,version,device,op_name,kernel_source,gemm_dtype,m,n,k,latency
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,65536,12288,30.9057854546441
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,65536,16384,40.87378946940104
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,65536,10240,26.558144463433162
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,65536,16384,62.248799641927086
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,65536,51200,132.84449598524307
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,65536,12288,48.54351467556424
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,65536,8192,26.297317504882812
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,65536,10240,39.32591417100694
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,65536,7168,21.477293226453995
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,65536,8192,45.794582790798614
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,65536,7168,37.09862263997396
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,65536,10240,52.937350802951386
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,65536,12288,63.961581759982636
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,65536,8192,31.567491319444443
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,65536,6144,17.973054673936634
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,65536,7168,28.183096991644963
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,65536,5120,14.64576382107205
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,65536,6144,31.939154730902775
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,65536,16384,88.34246826171875
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,65536,4096,11.375004238552519
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,65536,5120,20.01108635796441
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,65536,5120,26.65186055501302
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,65536,3584,10.230755276150173
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,65536,4096,21.393853081597225
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,65536,51200,204.4022894965278
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,65536,3584,13.687641567654081
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,65536,3072,9.105811225043402
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,65536,3584,18.723229302300346
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,65536,2560,7.60585700141059
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,65536,3072,11.723971896701388
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,65536,3072,14.420652601453993
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,65536,2560,8.948562622070312
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,65536,2560,8.979693094889322
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,65536,2048,6.296665615505642
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,65536,1536,4.631466759575738
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,65536,2048,6.542539384629991
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,65536,1536,4.743509504530165
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,65536,1024,3.2907271915011935
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,65536,1536,4.975888146294488
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,65536,1024,3.3435120052761502
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,65536,1024,3.65031009250217
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,65536,768,2.2686434851752386
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,65536,768,2.65555911593967
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,65536,512,1.9643546210394964
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,65536,768,2.901602639092339
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,65536,512,2.0359439849853516
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,65536,256,1.3923590977986653
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,65536,512,2.1355618370903864
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,65536,256,1.7962303161621094
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,65536,128,1.0059839884440105
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,65536,256,1.4947332806057398
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,65536,64,0.735454241434733
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,65536,128,1.7115110821194117
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,65536,6144,23.216790093315975
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,65536,32,0.7943538029988607
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,65536,64,1.7198799981011286
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,65536,32,2.1924071841769748
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,65536,4096,15.566099378797743
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,65536,2048,6.54495832655165
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,65536,128,1.1213661829630535
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,51200,16384,40.53270467122396
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,51200,51200,105.6640353732639
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,65536,51200,264.70968967013886
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,51200,65536,141.319091796875
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,51200,16384,70.40665011935764
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,51200,12288,26.216428968641495
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,51200,16384,50.43328518337674
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,51200,10240,22.960188123914932
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,51200,12288,37.742655436197914
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,51200,12288,50.826093885633675
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,51200,8192,18.32971021864149
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,51200,10240,42.06053331163194
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,51200,7168,15.149442884657118
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,51200,51200,208.61915418836804
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,51200,8192,24.825347900390625
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,51200,8192,35.899078369140625
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,51200,6144,13.640931023491753
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,51200,51200,162.06840006510416
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,51200,7168,20.454966227213543
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,51200,7168,29.39437527126736
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,51200,5120,11.587222629123263
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,51200,6144,25.33975897894965
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,51200,10240,30.724294026692707
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,51200,6144,19.141937255859375
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,51200,5120,15.580925835503471
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,51200,4096,8.887566460503473
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,51200,5120,21.136859469943577
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,51200,65536,210.133544921875
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,51200,3584,8.445253160264757
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,51200,4096,16.955274793836804
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,51200,4096,12.282149420844185
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,51200,3072,6.877274831136067
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,51200,3584,10.753482394748263
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,51200,3584,14.835666232638888
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,51200,2560,5.665647294786241
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,51200,2048,4.766224755181207
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,51200,3072,11.458593580457899
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,51200,3072,9.394096374511719
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,51200,2560,7.058113945855035
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,51200,2560,7.101384904649522
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,51200,2048,5.149710337320964
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,51200,1536,3.6957227918836804
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,51200,1024,2.564140531751845
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,51200,1536,3.7710088094075522
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,51200,2048,5.377927992078994
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,51200,768,1.809101316663954
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,51200,1536,3.982347700330946
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,51200,512,1.5362133449978297
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,51200,768,2.097291522555881
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,51200,1024,2.6167093912760415
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,51200,768,2.2469075520833335
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,51200,1024,2.8341937594943576
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,51200,128,0.6654711299472386
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,51200,256,1.1952550676133897
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,51200,256,1.1877582338121202
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,51200,512,1.6639555825127497
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,51200,256,1.4122177759806316
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,51200,512,1.6554462644788954
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,51200,128,1.3537591298421223
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,51200,32,0.5816951327853733
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,51200,64,0.7073342005411783
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,51200,64,1.350205315483941
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,51200,32,1.7200489044189453
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,51200,65536,290.98768446180554
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,16384,16384,11.366624620225695
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,51200,128,0.8874408933851453
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,16384,51200,33.83600192599827
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,16384,16384,24.97217305501302
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,16384,12288,8.84204355875651
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,16384,65536,44.51097276475695
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,16384,16384,16.31590101453993
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,16384,10240,7.397051493326823
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,16384,12288,12.565378824869791
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,16384,51200,54.115861680772575
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,16384,12288,18.116353352864582
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,16384,8192,5.887831793891059
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,16384,10240,10.044810824924046
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,16384,10240,14.9318118625217
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,16384,7168,4.9574809604220915
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,16384,8192,8.367312961154514
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,16384,8192,12.672706604003906
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,16384,7168,7.221537272135417
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,16384,6144,4.712937672932942
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,16384,7168,10.219158596462673
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,16384,65536,70.34109836154514
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,16384,5120,3.7054926554361978
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,16384,51200,74.73234049479167
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,16384,6144,7.400006612141927
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,16384,6144,6.221248202853733
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,16384,4096,2.8729154798719616
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,16384,5120,4.843038347032335
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,16384,5120,5.002957238091363
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,16384,3584,2.80641598171658
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,16384,4096,3.6911849975585938
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,16384,3072,2.369394726223416
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,16384,3584,3.148227479722765
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,16384,3584,3.4086507161458335
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,16384,4096,3.9121492173936634
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,16384,3072,2.548110326131185
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,16384,2560,1.9507821400960286
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,16384,2048,1.5931208928426106
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,16384,2560,2.155029296875
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,16384,2048,1.7642879486083984
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,16384,2560,2.4291458129882812
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,16384,1536,1.1801377402411568
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,16384,1024,0.7152373525831434
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,16384,2048,1.9720115661621094
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,16384,1024,0.995123545328776
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,16384,3072,2.9742461310492625
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,16384,1536,1.5172861946953669
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,16384,768,0.6252382066514757
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,16384,1536,1.4170239766438801
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,16384,1024,1.0955688688490126
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,16384,768,0.7872168752882215
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,16384,512,0.405149327384101
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,16384,256,0.28749243418375653
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,16384,512,0.6082364188300239
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,16384,128,0.2765137884351942
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,16384,768,0.8544435501098633
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,16384,256,0.45043643315633136
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,16384,64,0.212299558851454
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,16384,256,0.49930667877197266
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,16384,512,0.7361671129862467
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,16384,128,0.47455109490288633
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,16384,32,0.18132355478074816
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,16384,64,0.4421608977847629
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,16384,32,0.5361288918389214
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,16384,65536,103.37225341796875
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,12288,51200,24.9448479546441
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,12288,16384,8.495314704047308
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,12288,65536,31.033030192057293
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,12288,12288,6.405890570746528
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,16384,128,0.33037956555684406
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,12288,16384,13.512385050455729
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,12288,16384,19.347685072157116
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,12288,10240,5.380816989474827
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,12288,51200,46.2720947265625
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,12288,12288,10.196931627061632
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,12288,12288,14.292748345269096
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,12288,8192,4.569672054714627
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,12288,8192,7.802183363172744
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,12288,10240,8.500024583604601
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,12288,10240,11.667674594455294
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,12288,7168,3.5945866902669272
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,12288,8192,6.683199988471137
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,12288,65536,58.05303276909722
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,12288,51200,59.243184407552086
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,12288,6144,3.488979551527235
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,12288,7168,5.794461144341363
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,12288,7168,5.74578136867947
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,12288,5120,2.608859592013889
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,12288,6144,4.710081736246745
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,12288,5120,3.68354500664605
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,12288,6144,4.830060323079427
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,12288,5120,3.9125900268554688
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,12288,4096,2.3969972398546004
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,12288,4096,2.9084479014078775
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,12288,3584,2.4378729926215277
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,12288,4096,3.138341267903646
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,12288,3072,1.8376719156901042
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,12288,3584,2.430084440443251
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,12288,3584,2.7808746761745877
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,12288,3072,2.1058336893717446
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,12288,2560,1.7487413618299696
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,12288,2048,1.220303111606174
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,12288,2560,1.7829049428304036
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,12288,3072,2.411864810519748
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,12288,2048,1.4571662478976781
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,12288,1536,0.8775822321573893
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,12288,2560,1.9938969082302516
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,12288,2048,1.6048630608452692
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,12288,1024,0.562687979804145
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,12288,1536,1.2549777560763888
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,12288,768,0.444355567296346
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,12288,1024,0.810272905561659
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,12288,1536,1.2578941980997722
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,12288,768,0.6322542296515571
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,12288,512,0.33291999499003094
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,12288,256,0.21993422508239746
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,12288,128,0.164938661787245
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,12288,512,0.6087777879503038
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,12288,512,0.5370373196072048
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,12288,768,0.9454515245225695
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,12288,256,0.3847786585489909
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,12288,1024,1.2169715033637154
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,12288,256,0.4138791031307644
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,12288,64,0.13206488556332058
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,12288,32,0.13782844278547499
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,12288,128,0.36547109815809464
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,12288,64,0.3486791186862522
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,12288,32,0.36520976490444607
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,12288,65536,80.29688856336806
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,10240,16384,7.19468010796441
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,10240,51200,19.82030741373698
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,10240,65536,27.43917677137587
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,10240,16384,12.152666727701822
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,10240,12288,5.9259156121148004
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,10240,16384,17.113622029622395
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,12288,128,0.2627200020684136
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,10240,10240,5.062297821044922
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,10240,51200,40.03200954861111
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,10240,12288,9.10843234592014
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,10240,12288,12.585244072808159
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,10240,8192,4.038571675618489
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,10240,10240,9.103961520724827
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,10240,10240,7.592100355360244
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,10240,8192,5.790870242648655
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,10240,7168,3.2774088117811413
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,10240,8192,5.7581999037000875
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,10240,6144,2.6089564429389105
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,10240,7168,4.826346503363715
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,10240,51200,51.778523763020836
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,10240,7168,4.9152170817057295
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,10240,6144,3.7332835727267795
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,10240,5120,2.1386915842692056
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,10240,65536,52.41144816080729
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,10240,4096,1.8760515848795574
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,10240,5120,3.159088982476128
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,10240,6144,4.224286397298177
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,10240,3584,1.4566755294799805
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,10240,4096,2.4707938300238714
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,10240,5120,3.5185165405273438
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,10240,4096,2.794827567206489
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,10240,3072,1.4818489286634657
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,10240,2560,1.1110995610555012
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,10240,3584,2.1869884067111545
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,10240,3072,1.9090773264567058
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,10240,3584,2.5093396504720054
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,10240,2048,0.986061308119032
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,10240,3072,2.200089772542318
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,10240,2560,1.5709848403930664
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,10240,1536,0.6747306717766656
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,10240,1024,0.44398045539855957
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,10240,2048,1.2808204227023654
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,10240,2560,1.8044196234809027
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,10240,1536,1.1366959677802193
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,10240,2048,1.4872319963243272
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,10240,768,0.3458328776889377
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,10240,1536,1.1393413543701172
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,10240,1024,0.8196044498019748
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,10240,512,0.24620355500115287
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,10240,768,0.5610737800598145
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,10240,1024,1.0405990812513564
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,10240,256,0.1825031174553765
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,10240,512,0.4831226666768392
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,10240,512,0.49958488676283097
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,10240,768,0.6512106789482964
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,10240,128,0.15760266780853271
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,10240,256,0.3330684502919515
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,10240,64,0.1126684480243259
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,10240,256,0.3207520114050971
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,10240,128,0.30493066045973033
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,10240,32,0.11824177371131049
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,10240,64,0.31904978222317165
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,10240,32,0.29706401295132107
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,10240,65536,69.87306722005208
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,8192,16384,5.58368640475803
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,8192,51200,16.661446465386284
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,8192,65536,23.76037089029948
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,8192,16384,10.801767137315538
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,8192,12288,4.228356255425347
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,8192,16384,12.9600830078125
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,8192,10240,3.8030196295844187
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,8192,12288,8.273034837510851
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,8192,12288,7.976283603244358
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,10240,128,0.22851199573940703
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,8192,10240,6.101843516031901
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,8192,51200,35.63771226671007
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,8192,8192,3.2863822513156467
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,8192,7168,2.5646692911783853
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,8192,8192,4.333591885036893
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,8192,10240,6.530869377983941
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,8192,7168,3.7895554436577688
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,8192,8192,5.0068338182237415
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,8192,51200,43.438568115234375
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,8192,6144,2.3550870683458114
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,8192,5120,1.9010151757134333
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,8192,7168,4.329181247287326
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,8192,6144,3.239990234375
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,8192,5120,2.699025683932834
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,8192,4096,1.4804613325330946
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,8192,6144,3.7506311204698353
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,8192,65536,46.41350979275174
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,8192,3584,1.1811502244737413
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,8192,5120,3.1032808091905384
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,8192,4096,2.141498565673828
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,8192,3072,1.001572397020128
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,8192,4096,2.551208919949002
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,8192,2560,0.9455359776814779
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,8192,3584,1.8937786950005426
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,8192,3584,2.2024214002821183
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,8192,2048,0.8228266504075793
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,8192,3072,1.663895077175564
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,8192,3072,1.9045946333143446
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,8192,2048,1.1214941872490776
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,8192,1536,0.5209466616312662
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,8192,2560,1.6694382561577692
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,8192,1024,0.36914398935106063
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,8192,1536,0.8664791319105359
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,8192,768,0.2880062262217204
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,8192,1536,1.0128862592909071
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,8192,2048,1.3047591315375435
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,8192,1024,0.8607208993699816
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,8192,512,0.20912799570295545
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,8192,768,0.48097599877251523
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,8192,1024,0.7254346741570367
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,8192,256,0.1616977718141344
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,8192,512,0.365955564710829
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,8192,2560,1.413958231608073
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,8192,128,0.13577955298953587
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,8192,256,0.2786124547322591
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,8192,256,0.2744639979468452
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,8192,64,0.11246932877434625
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,8192,768,0.7354248894585503
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,8192,32,0.09295555618074204
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,8192,128,0.19441600640614828
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,8192,128,0.24290132522583008
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,8192,64,0.23550844192504883
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,8192,32,0.24798843595716688
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,8192,512,0.4295910994211833
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,7168,16384,5.171750386555989
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,8192,65536,58.576938205295136
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,7168,51200,15.083151923285591
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,7168,16384,9.947115580240885
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,7168,16384,10.98145972357856
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,7168,12288,3.9788487752278647
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,7168,65536,20.76746283637153
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,7168,10240,3.459379620022244
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,7168,12288,6.836374918619792
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,7168,12288,7.259925842285156
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,7168,10240,5.303138732910156
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,7168,8192,2.657531526353624
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,7168,10240,5.877382914225261
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,7168,7168,2.163976033528646
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,7168,8192,3.9665573967827688
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,7168,8192,4.643492380777995
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,7168,6144,2.1080203586154513
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,7168,7168,3.5658285352918835
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,7168,7168,4.04511472913954
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,7168,5120,1.617979579501682
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,7168,6144,3.0183262295193143
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,7168,51200,33.33692423502604
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,7168,6144,3.4646470811631946
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,7168,4096,1.2207084231906467
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,7168,5120,2.5199271308051214
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,7168,4096,1.9892569647894964
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,7168,3584,1.1134701834784615
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,7168,51200,36.82122124565972
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,7168,5120,2.909207026163737
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,7168,3072,1.0449084175957573
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,7168,3584,1.7567431131998699
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,7168,4096,2.359419504801432
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,7168,3072,1.524776882595486
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,7168,2560,0.8397066858079699
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,7168,3072,1.789788352118598
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,7168,3584,2.0633040534125433
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,7168,2048,0.614666673872206
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,7168,2560,1.2767315970526802
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,7168,1536,0.48288975821601016
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,7168,1024,0.324160893758138
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,7168,2560,1.506856918334961
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,7168,2048,1.2323680453830295
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,7168,2048,1.1423252953423393
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,7168,768,0.25677598847283256
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,7168,1536,0.948971536424425
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,7168,512,0.19077689117855498
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,7168,1024,0.6781893306308322
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,7168,1024,0.8165635532803006
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,7168,256,0.13065600395202637
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,7168,768,0.585244443681505
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,7168,512,0.3397342099083795
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,7168,512,0.3921822177039252
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,7168,128,0.096852441628774
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,7168,256,0.261553790834215
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,7168,256,0.2573057810465495
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,7168,64,0.08515822225146824
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,7168,128,0.21762488947974312
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,7168,32,0.0903066661622789
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,7168,1536,1.0294240315755208
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,7168,64,0.21198488606346977
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,7168,32,0.2094177802403768
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,7168,768,0.44780445098876953
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,7168,65536,43.0301513671875
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,7168,65536,51.47411431206597
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,6144,16384,4.405524359809028
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,6144,51200,14.064431932237413
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,6144,65536,16.57538011338976
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,6144,12288,3.249494128757053
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,6144,16384,9.150677998860678
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,6144,16384,9.538831075032553
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,6144,12288,5.689985063340928
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,6144,10240,2.7186417049831815
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,6144,10240,4.641783820258246
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,6144,12288,6.634076436360677
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,6144,51200,31.840498182508682
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,6144,10240,5.482320149739583
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,6144,8192,2.299309412638346
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,6144,51200,30.823164198133682
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,6144,8192,3.7231424119737415
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,6144,7168,2.060910118950738
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,7168,128,0.1774302191204495
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,6144,7168,3.211470286051432
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,6144,6144,1.808269288804796
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,6144,8192,4.333633846706815
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,6144,5120,1.3621208402845595
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,6144,7168,3.7998682657877603
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,6144,6144,2.7666524251302085
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,6144,4096,1.1051173739963107
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,6144,6144,3.258581373426649
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,6144,5120,2.3349626329210067
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,6144,5120,2.7368426852756076
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,6144,3584,0.9114916059705945
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,6144,4096,1.8555164337158203
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,6144,4096,2.212381362915039
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,6144,3072,0.7802151044209799
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,6144,3584,1.6234631008572047
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,6144,65536,39.99270290798611
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,6144,2560,0.6368888749016656
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,6144,3584,1.9434649149576824
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,6144,3072,1.4521155887179906
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,6144,3072,1.6899003982543945
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,6144,2048,0.5273057619730631
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,6144,1536,0.40335644616021055
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,6144,2560,1.2782284418741863
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,6144,2560,1.4182888666788738
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,6144,1024,0.2665804492102729
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,6144,2048,1.0370844735039604
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,6144,1536,0.7447653346591525
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,6144,768,0.21450755331251356
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,6144,2048,1.1555004119873047
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,6144,1024,0.5294488800896539
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,6144,512,0.1625022225909763
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,6144,768,0.41034844186570907
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,6144,1536,0.9349031448364258
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,6144,1024,0.634119987487793
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,6144,256,0.14074488480885824
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,6144,512,0.3054080009460449
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,6144,128,0.08278933498594496
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,6144,768,0.49891111585828996
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,6144,64,0.06914222240447998
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,6144,65536,43.09361436631945
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,6144,512,0.3634177843729655
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,6144,256,0.22413510746426055
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,6144,256,0.23199733098347983
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,6144,128,0.16033689181009927
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,6144,128,0.2666089004940457
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,6144,32,0.07412088579601712
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,6144,64,0.18243822786543104
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,6144,32,0.18122755156622994
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,5120,16384,3.4360489315456815
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,5120,16384,7.389539930555556
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,5120,51200,11.330603705512154
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,5120,12288,2.923599031236437
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,5120,16384,8.32489013671875
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,5120,10240,2.302471160888672
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,5120,65536,15.739145914713541
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,5120,12288,5.0747252570258246
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,5120,8192,1.8607813517252605
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,5120,12288,6.089399125840928
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,5120,10240,4.228662278917101
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,5120,7168,1.5813413196139867
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,5120,10240,5.081740485297309
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,5120,8192,3.3503040737575955
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,5120,8192,4.0542043050130205
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,5120,6144,1.4347955915662978
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,5120,7168,2.9600550333658853
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,5120,7168,3.5610309176974826
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,5120,5120,1.08806398179796
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,5120,6144,2.5387395222981772
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,5120,51200,25.802242702907986
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,5120,4096,0.8718791007995605
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,5120,5120,2.1237244076199002
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,5120,6144,3.0641458299424915
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,5120,3584,0.7107466591729058
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,5120,4096,1.7023021909925673
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,5120,5120,2.572863048977322
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,5120,3072,0.6073377927144369
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,5120,4096,2.079947577582465
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,5120,3584,1.4881359736124675
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,5120,2560,0.5477386580573188
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,5120,51200,28.420701768663193
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,5120,3072,1.2893760469224718
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,5120,2560,1.0861821704440646
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,5120,2048,0.43707021077473956
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,5120,3584,1.8345618777804906
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,5120,1536,0.3343946668836806
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,5120,2048,0.8857262399461535
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,5120,3072,1.6043057971530492
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,5120,1024,0.2410693433549669
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,5120,1536,0.6787581973605685
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,5120,2560,1.359050644768609
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,5120,768,0.17376532819535997
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,5120,2048,1.0849315855238173
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,5120,1024,0.48156176673041445
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,5120,512,0.13609245088365343
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,5120,768,0.3717679977416992
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,5120,1024,0.6390159924825033
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,5120,1536,0.8768204583062066
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,5120,768,0.4717804590861003
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,5120,256,0.09214399920569526
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,5120,128,0.07152266634835137
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,5120,512,0.33392800225151914
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,5120,256,0.200619551870558
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,5120,64,0.06126488579644097
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,5120,128,0.16553866863250732
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,5120,32,0.06571733289294772
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,5120,128,0.14499821927812365
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,5120,64,0.15632000234391955
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,5120,32,0.15228533744812012
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,5120,512,0.2753688759273953
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,5120,256,0.21043199963039824
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,5120,65536,35.93358696831597
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,5120,65536,37.593536376953125
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,4096,16384,2.8204871283637156
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,4096,51200,9.067237006293402
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,4096,12288,2.105326122707791
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,4096,65536,11.397505866156685
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,4096,16384,6.2520018683539496
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,4096,10240,2.0492195553249783
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,4096,16384,7.6001985337999125
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,4096,12288,4.624065823025174
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,4096,12288,5.663393656412761
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,4096,8192,1.4444888432820637
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,4096,10240,3.854864756266276
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,4096,10240,4.71212641398112
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,4096,8192,3.0571475558810763
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,4096,7168,1.3524257871839735
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,4096,8192,3.790493435329861
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,4096,6144,1.3916764789157445
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,4096,7168,2.688976075914171
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,4096,5120,0.8072720103793674
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,4096,7168,3.328158272637261
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,4096,51200,23.112438625759548
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,4096,6144,2.317333433363173
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,4096,4096,0.6717822286817762
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,4096,6144,2.8667040930853953
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,4096,4096,1.5439537896050348
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,4096,5120,1.9437476264105902
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,4096,3584,0.5883973439534506
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,4096,5120,2.4041199154324002
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,4096,3072,0.5621084637112087
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,4096,4096,1.9465306599934895
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,4096,3584,1.3589440451727972
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,4096,2560,0.430478228463067
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,4096,51200,25.954211764865452
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,4096,3584,1.7054239908854167
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,4096,2048,0.33068977461920845
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,4096,3072,1.3531324598524306
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,4096,3072,1.4740542305840387
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,4096,2560,1.0433804194132488
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,4096,1536,0.260079993142022
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,4096,1024,0.1772488885455661
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,4096,2560,1.2451057434082031
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,4096,2048,0.8410444259643555
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,4096,768,0.13571911387973362
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,4096,1536,0.6170133484734429
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,4096,2048,1.0070568720499675
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,4096,512,0.11064533392588298
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,4096,1536,0.7761262257893881
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,4096,1024,0.5113617579142252
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,4096,1024,0.5472488933139378
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,4096,256,0.07269689109590319
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,4096,768,0.3374737898508708
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,4096,128,0.05683466460969713
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,4096,512,0.24519644843207467
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,4096,512,0.3041235605875651
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,4096,256,0.1915217770470513
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,4096,256,0.17023821671803793
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,4096,64,0.04745066828197903
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,4096,128,0.12628444035847983
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,4096,32,0.04855288730727302
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,4096,128,0.1399866607454088
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,4096,65536,30.109792073567707
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,4096,64,0.13065866629282633
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,4096,32,0.12450044684939915
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,4096,768,0.4253191153208415
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,3584,16384,2.624551984998915
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,4096,65536,33.855919731987846
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,3584,51200,8.933816697862413
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,3584,16384,5.919216156005859
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,3584,12288,2.0727547539605036
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,3584,65536,11.671190049913195
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,3584,16384,7.317525227864583
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,3584,10240,1.6519076029459636
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,3584,12288,4.385367075602214
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,3584,8192,1.205500496758355
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,3584,10240,3.6503991021050344
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,3584,12288,5.463653140597874
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,3584,10240,4.556753794352214
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,3584,7168,1.102295133802626
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,3584,8192,2.9158852895100913
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,3584,6144,0.8096506860521105
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,3584,8192,3.6625518798828125
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,3584,7168,2.5612426333957248
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,3584,51200,20.606904771592884
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,3584,5120,0.7066035800509982
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,3584,7168,3.2122372521294484
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,3584,4096,0.5907697677612305
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,3584,6144,2.7682168748643665
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,3584,5120,1.8419812520345051
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,3584,6144,2.1976941426595054
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,3584,3584,0.49701690673828125
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,3584,4096,1.4847190645005968
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,3584,5120,2.3244080013699002
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,3584,3584,1.2909751468234592
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,3584,4096,1.8725573221842449
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,3584,3072,0.42765243848164874
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,3584,2560,0.36661243438720703
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,3584,3584,1.6566658020019531
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,3584,3072,1.117054197523329
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,3584,2048,0.3202853202819824
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,3584,2560,0.966984854804145
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,3584,1536,0.2350755532582601
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,3584,3072,1.4224533504909938
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,3584,65536,26.038291083441838
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,3584,2560,1.2152569029066298
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,3584,2048,0.764119995964898
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,3584,1024,0.15861599975162083
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,3584,51200,24.789133707682293
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,3584,768,0.13237599531809488
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,3584,1536,0.6563119888305664
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,3584,2048,0.9719644122653537
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,3584,1024,0.41302932633294004
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,3584,1536,0.7454071044921875
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,3584,512,0.09139377541012234
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,3584,1024,0.5230328771803114
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,3584,256,0.06352800130844116
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,3584,128,0.05474755499098036
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,3584,256,0.15922399361928305
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,3584,512,0.2297875616285536
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,3584,256,0.1748053365283542
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,3584,512,0.28960977660285103
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,3584,768,0.3168231116400825
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,3584,768,0.41086400879753965
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,3584,64,0.047015110651652016
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,3584,32,0.04827466607093811
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,3584,128,0.12703643904791936
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,3584,64,0.11543999777899848
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,3584,32,0.11046755313873291
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,3584,65536,31.899858262803818
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,3072,51200,7.527905782063802
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,3072,65536,9.149109734429254
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,3072,16384,2.0182728237575955
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,3072,12288,1.5210498174031575
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,3072,16384,5.506397247314453
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,3072,12288,4.1521992153591585
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,3072,16384,7.040809631347656
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,3072,10240,1.3175332811143663
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,3072,12288,5.254790412055121
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,3072,51200,18.870225694444446
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,3072,8192,1.0480115678575304
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,3072,10240,3.472868389553494
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,3072,7168,0.9583715862698026
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,3072,10240,4.395154741075304
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,3072,8192,2.770626703898112
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,3072,6144,0.8143439822726779
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,3072,7168,2.4402311113145614
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,3072,8192,3.529895994398329
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,3072,51200,23.71500311957465
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,3072,5120,0.6447075737847222
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,3072,7168,3.0983128017849393
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,3072,65536,25.025500827365452
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,3072,4096,0.48103290134006077
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,3072,6144,2.09080441792806
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,3072,3584,0.45176177554660374
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,3072,5120,1.7390648523966472
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,3072,6144,2.6709200541178384
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,3072,3072,0.3715244399176703
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,3072,5120,2.239198260837131
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,3072,4096,1.8163912031385634
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,3072,3584,1.2609181933932834
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,3072,2560,0.3192568884955512
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,3072,3584,1.5834461847941081
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,3072,3072,1.0852008395724826
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,3072,2048,0.27800533506605357
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,3072,2560,0.8916364245944552
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,3072,3072,1.3679786258273656
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,3072,1536,0.20251733726925322
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,3072,2048,0.7243306901719836
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,3072,4096,1.3919066323174372
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,3072,1024,0.14328000280592176
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,3072,2560,1.1675262451171875
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,3072,1536,0.553616894616021
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,3072,768,0.10193777746624416
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,3072,2048,0.9594435162014432
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,3072,512,0.07639200157589383
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,3072,768,0.2985600100623237
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,3072,1536,0.7404790984259711
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,3072,1024,0.38694487677680117
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,3072,256,0.057327999009026416
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,3072,1024,0.5120382308959961
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,3072,768,0.38871023390028214
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,3072,512,0.21474756134880912
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,3072,128,0.043875555197397866
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,3072,256,0.14276799890730116
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,3072,512,0.27480800946553546
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,3072,256,0.1653439998626709
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,3072,32,0.03917333483695984
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,3072,128,0.10917333099577163
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,3072,128,0.11358933978610569
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,3072,64,0.10196799702114528
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,3072,32,0.0980328917503357
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,3072,65536,30.522210015190975
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,3072,64,0.037907554043663874
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,2560,16384,1.8096995883517797
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,2560,51200,5.778717464870876
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,3584,128,0.11744533644782172
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,2560,65536,7.5672107272677955
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,2560,12288,1.2818542056613498
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,2560,16384,5.282268524169922
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,2560,10240,1.1228746838039823
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,2560,12288,3.8989457024468313
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,2560,16384,6.747467464870876
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,2560,12288,5.063133239746094
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,2560,10240,3.278671900431315
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,2560,8192,0.8742853270636665
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,2560,7168,0.8540444374084473
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,2560,8192,2.6170692443847656
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,2560,10240,4.228729671902127
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,2560,6144,0.6357057889302572
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,2560,8192,3.4058329264322915
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,2560,7168,2.2958265940348306
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,2560,5120,0.4999217987060547
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,2560,51200,17.778210110134548
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,2560,7168,2.9813412560356984
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,2560,6144,1.9781608581542969
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,2560,4096,0.45617156558566624
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,2560,6144,2.5699475606282554
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,2560,5120,1.6625635359022353
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,2560,3584,0.3726773262023926
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,2560,4096,1.3166755040486653
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,2560,5120,2.1482550303141275
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,2560,3072,0.3158622317843967
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,2560,3584,1.1595564948187935
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,2560,4096,1.7485253016153972
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,2560,2560,0.2889600065019396
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,2560,3584,1.5356053246392145
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,2560,3072,1.001450644599067
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,2560,2048,0.22448711925082734
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,2560,3072,1.3238346311781142
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,2560,2560,0.8410071267022027
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,2560,1536,0.1553573343488905
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,2560,2048,0.6822444597880045
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,2560,2560,1.1284159554375541
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,2560,1024,0.11568355560302734
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,2560,2048,0.9081368976169162
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,2560,1536,0.5272524621751573
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,2560,768,0.08095288938946195
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,2560,1536,0.6856506665547689
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,2560,1024,0.47870397567749023
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,2560,768,0.28096622890896267
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,2560,512,0.0697537793053521
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,2560,768,0.3700088924831814
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,2560,256,0.045626666810777455
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,2560,65536,22.371414184570312
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,2560,512,0.1998142268922594
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,2560,512,0.2596408791012234
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,2560,256,0.12946577866872153
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,2560,256,0.15252799457973903
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,2560,128,0.037809779246648155
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,2560,64,0.03506933318244086
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,2560,128,0.10143111149470012
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,2560,32,0.03709333472781711
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,2560,64,0.0888177752494812
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,2560,51200,22.737123277452255
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,2560,32,0.08329777585135566
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,2560,1024,0.3647760020362006
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,2560,128,0.10046399964226617
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,2048,16384,1.3947697745429144
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,2048,51200,4.959791819254558
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,2560,65536,29.027950710720486
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,2048,65536,5.623325347900391
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,2048,12288,0.9845857620239258
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,2048,16384,4.957579718695746
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,2048,10240,0.838405344221327
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,2048,12288,3.6919742160373263
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,2048,12288,4.871307373046875
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,2048,16384,6.477078331841363
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,2048,10240,3.0900561014811196
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,2048,8192,0.6685262256198459
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,2048,7168,0.643979549407959
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,2048,10240,4.067571428087023
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,2048,8192,2.466302235921224
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,2048,6144,0.49837419721815324
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,2048,8192,3.275100496080187
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,2048,7168,2.171919080946181
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,2048,5120,0.4159253438313802
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,2048,51200,16.06035698784722
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,2048,7168,2.865067587958442
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,2048,6144,1.8638746473524306
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,2048,4096,0.34282488293117946
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,2048,5120,1.5635022057427301
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,2048,6144,2.469672097100152
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,2048,3584,0.26968712276882595
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,2048,4096,1.2458808686998155
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,2048,3072,0.23813332451714408
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,2048,5120,2.061127132839627
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,2048,4096,1.6720764372083876
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,2048,2560,0.23027645217047799
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,2048,3584,1.0942089292738173
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,2048,3072,0.9533813264634875
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,2048,3584,1.4592231114705403
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,2048,2048,0.1539751158820258
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,2048,2560,0.8139315711127387
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,2048,3072,1.2583689159817166
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,2048,1536,0.13264977931976318
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,2048,2560,1.05913511912028
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,2048,2048,0.6407404475741917
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,2048,1024,0.09465510977639092
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,2048,1536,0.49053155051337344
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,2048,65536,20.43283928765191
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,2048,2048,0.8644195662604438
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,2048,768,0.07154666715198092
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,2048,1024,0.3410222265455458
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,2048,512,0.056701335642072886
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,2048,1536,0.6677218013339572
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,2048,256,0.035981333918041654
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,2048,1024,0.4560942120022244
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,2048,512,0.18418310748206246
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,2048,768,0.35259556770324707
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,2048,768,0.2612160046895345
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,2048,256,0.1153893338309394
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,2048,128,0.03022577696376377
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,2048,256,0.14208622773488364
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,2048,64,0.025791111919615004
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,2048,32,0.02606577840116289
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,2048,128,0.0922693345281813
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,2048,128,0.08875822358661228
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,2048,64,0.07523377736409505
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,2048,32,0.06959111160702176
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,2048,51200,21.798543294270832
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,2048,512,0.24495911598205566
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,1536,16384,1.0996987024943035
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,1536,51200,3.463945812649197
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,1536,65536,4.5759663052029085
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,1536,12288,0.870431105295817
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,2048,65536,27.89301045735677
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,1536,16384,4.602486928304036
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,1536,10240,0.637529797024197
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,1536,12288,3.4665741390652127
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,1536,16384,6.215497758653428
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,1536,10240,2.8844114939371743
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,1536,8192,0.4865724245707194
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,1536,12288,4.67268541124132
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,1536,7168,0.46991289986504453
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,1536,8192,2.31169064839681
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,1536,10240,3.9047876993815103
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,1536,6144,0.3999626636505127
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,1536,7168,2.034299638536241
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,1536,8192,3.138475630018446
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,1536,51200,14.838233100043404
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,1536,5120,0.3318871127234565
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,1536,6144,1.7515040503607855
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,1536,4096,0.2637146578894721
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,1536,7168,2.745664808485243
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,1536,5120,1.4567173851860895
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,1536,3584,0.2326942284901937
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,1536,5120,1.982012430826823
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,1536,4096,1.1848942438761394
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,1536,3072,0.20160888301001656
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,1536,3584,1.0444311565823026
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,1536,4096,1.5895653830634222
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,1536,2560,0.16887377368079293
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,1536,6144,2.359210756089952
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,1536,3584,1.3980862299601238
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,1536,2048,0.1404871145884196
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,1536,65536,18.873804728190105
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,1536,3072,0.8958062065972222
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,1536,1536,0.10392355256610447
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,1536,2560,0.7563893530103895
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,1536,3072,1.2033750745985243
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,1536,1024,0.0741128921508789
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,1536,2048,0.6004648738437229
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,1536,2560,1.0092088911268446
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,1536,1536,0.4574711057874892
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,1536,768,0.05948177973429362
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,1536,1024,0.317758215798272
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,1536,1536,0.6243511305914985
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,1536,512,0.043362667163213096
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,1536,2048,0.8169537650214301
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,1536,256,0.02870133188035753
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,1536,768,0.33308090103997123
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,1536,512,0.16838755872514513
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,1536,128,0.02422222163942125
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,1536,512,0.22909779018825957
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,1536,256,0.10130844513575236
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,1536,256,0.13075289461347792
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,1536,64,0.020948444803555805
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,1536,32,0.021511110994550917
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,1536,128,0.08318399720721774
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,1536,128,0.07533866829342313
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,1536,64,0.06200622187720405
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,1536,32,0.05565422111087375
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,1536,768,0.24268089400397408
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,1536,1024,0.4321964316897922
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,1536,51200,20.88741726345486
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,1024,16384,0.6911422411600748
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,1024,51200,2.3961156209309897
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,1024,65536,3.0993003845214844
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,1024,12288,0.5815902286105686
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,1536,65536,26.731686062282986
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,1024,16384,4.302588568793403
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,1024,12288,3.2314453125
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,1024,10240,0.46737511952718097
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,1024,16384,5.947621239556207
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,1024,8192,0.3524266613854303
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,1024,10240,2.695975197686089
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,1024,12288,4.476580301920573
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,1024,10240,3.7356524997287326
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,1024,8192,2.161191940307617
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,1024,7168,0.3155306710137261
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,1024,6144,0.2751235432094998
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,1024,8192,2.9963075849745007
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,1024,7168,1.8915555742051866
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,1024,5120,0.2512044376797146
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,1024,6144,1.6364417605929906
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,1024,7168,2.6252354515923395
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,1024,4096,0.18777067131466338
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,1024,51200,13.579948425292969
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,1024,5120,1.371707598368327
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,1024,3584,0.17354488372802734
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,1024,6144,2.257708443535699
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,1024,4096,1.097866694132487
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,1024,5120,1.8873511420355902
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,1024,3072,0.13131733735402426
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,1024,4096,1.5172355439927843
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,1024,3584,0.9590924580891927
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,1024,2560,0.11827199988894993
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,1024,3072,0.8249982198079427
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,1024,2048,0.09631999995973374
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,1024,3584,1.3310168584187825
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,1024,3072,1.1491279602050781
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,1024,2560,0.6912248929341634
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,1024,1536,0.07260177532831828
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,1024,2048,0.5590560171339247
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,1024,2560,0.9609662161933051
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,1024,65536,17.31373765733507
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,1024,1536,0.42428888214959043
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,1024,768,0.041598220666249595
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,1024,2048,0.7772800127665201
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,1024,1536,0.591743999057346
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,1024,1024,0.2920284536149767
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,1024,512,0.025054223007626
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,1024,768,0.22324087884691027
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,1024,1024,0.4075982305738661
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,1024,512,0.15114843845367432
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,1024,768,0.3139466709560818
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,1024,256,0.019706666469573975
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,1024,512,0.21307199531131318
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,1024,128,0.016014221641752455
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,1024,256,0.08683111270268758
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,1024,256,0.11944799953036839
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,1024,64,0.014468444718254937
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,1024,128,0.07475466860665216
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,1024,128,0.06202489137649536
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,1024,32,0.014811555544535318
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,1024,1024,0.05076533224847582
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,1024,64,0.04858577913708157
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,1024,32,0.04231466518508064
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,768,51200,1.8271804385715062
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,768,65536,2.367860370212131
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,1024,51200,20.049930148654514
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,768,16384,0.597599983215332
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,768,12288,0.4297928810119629
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,768,12288,3.111461427476671
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,768,16384,4.151250627305773
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,768,10240,0.33212799496120876
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,1024,65536,25.62152608235677
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,768,16384,5.845008002387153
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,768,8192,0.2690009011162652
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,768,10240,2.597600089179145
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,768,12288,4.38302485148112
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,768,7168,0.24621333016289604
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,768,8192,2.0853583017985025
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,768,10240,3.659143235948351
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,768,6144,0.22067999839782715
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,768,8192,2.9361902872721353
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,768,7168,1.8231635623508031
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,768,5120,0.16507911682128906
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,768,6144,1.5782426198323567
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,768,51200,13.012519836425781
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,768,4096,0.13690666357676187
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,768,7168,2.5759396023220487
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,768,5120,1.307930628458659
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,768,3584,0.11650666925642227
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,768,4096,1.0516497294108074
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,768,5120,1.8466951582166884
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,768,6144,2.210629357231988
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,768,3072,0.11196977562374538
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,768,4096,1.4861493640475805
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,768,2560,0.09256800015767415
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,768,3584,0.9218426810370551
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,768,3072,0.793967088063558
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,768,2048,0.07482844591140747
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,768,2560,0.6654275788201226
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,768,3584,1.3012142181396484
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,768,1536,0.056886222627427846
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,768,3072,1.1204053031073677
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,768,2560,0.9380480448404948
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,768,1024,0.041489776637819074
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,768,1536,0.4075306786431207
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,768,2048,0.7593510945638021
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,768,768,0.02921244502067566
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,768,1024,0.2791066699557834
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,768,1024,0.3966533342997233
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,768,512,0.020042666130595736
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,768,768,0.3047422303093804
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,768,512,0.14227555857764349
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,768,256,0.015396444333924187
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,768,512,0.20694311459859213
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,768,65536,16.647130330403645
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,768,256,0.11388266086578369
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,768,128,0.013062222136391534
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,768,128,0.05535644292831421
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,768,64,0.012259555359681448
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,768,1536,0.5777937571207682
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,768,32,0.012737777498033313
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,768,128,0.07015733586417304
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,768,64,0.04144710964626736
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,768,32,0.03492000036769443
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,768,768,0.21256532933976915
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,768,2048,0.5368302133348253
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,512,51200,1.2024337980482314
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,512,65536,1.5947848425971136
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,512,16384,0.40220001008775497
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,768,51200,19.647204928927952
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,768,256,0.08046578036414252
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,512,12288,0.2704373465643989
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,512,16384,3.9943457709418406
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,512,12288,2.997854232788086
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,768,65536,25.138288709852432
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,512,10240,0.2569235430823432
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,512,16384,5.692899492051866
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,512,8192,0.1934293376074897
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,512,10240,2.5069974263509116
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,512,12288,4.2729441324869795
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,512,8192,2.0068143208821616
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,512,10240,3.562310960557726
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,512,7168,0.17511110835605195
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,512,6144,0.1507884396447076
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,512,7168,1.7582186592949762
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,512,8192,2.856809828016493
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,512,5120,0.12219377358754475
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,512,7168,2.5020275115966797
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,512,51200,12.522857666015625
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,512,4096,0.10582044389512803
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,512,6144,1.5096364551120336
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,512,5120,1.259744856092665
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,512,3584,0.08475999699698554
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,512,6144,2.151132371690538
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,512,4096,1.0119529300265842
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,512,3072,0.07895733250512017
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,512,5120,1.794905768500434
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,512,3584,0.8865875667995877
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,512,2560,0.061384002367655434
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,512,4096,1.4434675640530055
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,512,3072,0.7628364562988281
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,512,2048,0.05520177880922953
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,512,3584,1.2654684914482963
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,512,65536,15.975980970594618
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,512,2560,0.6387626859876845
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,512,3072,1.0882417890760634
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,512,1536,0.04169866773817274
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,512,2048,0.51491912206014
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,512,1024,0.02756711178355747
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,512,2560,0.9134239620632596
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,512,768,0.020980444219377305
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,512,1536,0.38956178559197324
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,512,1024,0.26561421818203396
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,512,512,0.015164444843928019
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,512,2048,0.7362088627285428
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,512,768,0.20254045062594941
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,512,1024,0.38312710656060117
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,512,1536,0.5589893129136827
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,512,256,0.011726222104496427
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,512,128,0.010020444790522257
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,512,768,0.29380178451538086
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,512,512,0.1984257830513848
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,512,256,0.07166488965352376
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,512,256,0.10827733410729302
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,512,64,0.009887110855844285
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,512,128,0.04651644494798449
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,512,32,0.01015733347998725
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,512,128,0.0653217766020033
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,512,64,0.03392088744375441
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,512,32,0.02773777809407976
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,256,51200,0.6569893095228407
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,256,65536,0.8432470957438151
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,512,512,0.13469333118862575
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,256,16384,0.22652000851101348
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,512,51200,19.21154106987847
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,256,12288,0.1647226678000556
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,256,16384,3.851927863226997
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,256,12288,2.891285366482205
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,256,16384,5.572237226698134
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,256,10240,0.13292977544996473
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,512,65536,24.552083333333332
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,256,8192,0.1192035542594062
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,256,12288,4.1856363084581165
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,256,10240,2.411182191636827
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,256,7168,0.09879555304845174
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,256,8192,1.9340214199490016
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,256,10240,3.4939083523220487
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,256,6144,0.09102400143941243
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,256,7168,1.6913252936469183
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,256,8192,2.796971638997396
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,256,6144,1.452721807691786
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,256,5120,0.07502044571770562
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,256,51200,12.055511474609375
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,256,7168,2.44908078511556
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,256,4096,0.06029511160320706
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,256,4096,0.9730968475341797
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,256,3584,0.0514613323741489
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,256,5120,1.212227503458659
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,256,6144,2.1046568552652993
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,256,3072,0.04397066765361362
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,256,4096,1.4102168613009984
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,256,5120,1.7573955323961046
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,256,2560,0.038070221741994224
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,256,3584,0.8531822098626031
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,256,3072,0.733284420437283
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,256,2048,0.03047910994953579
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,256,2560,0.6131786770290798
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,256,3584,1.2385066350301106
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,256,1536,0.023676445086797077
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,256,2048,0.49410491519504124
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,256,3072,1.0636133617824979
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,256,1024,0.014328888720936246
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,256,1536,0.37415467368231875
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,256,2560,0.8903946346706815
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,256,768,0.011824888487656912
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,256,65536,15.3849605984158
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,256,1024,0.25470932324727374
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,256,2048,0.7187902132670084
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,256,512,0.009316444396972656
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,256,1536,0.5462649133470323
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,256,768,0.19362933105892607
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,256,1024,0.3728782335917155
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,256,512,0.12765422132280138
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,256,512,0.19037332799699572
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,256,256,0.06516089042027791
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,256,768,0.2848400010002984
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,256,128,0.006911110960774952
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,256,256,0.10467288891474406
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,256,64,0.007136888802051544
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,256,32,0.0069724445541699724
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,256,128,0.06016888883378771
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,256,128,0.03769777880774604
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,256,64,0.027129777603679236
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,256,32,0.02167911165290409
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,128,51200,0.5508515569898818
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,128,65536,0.6996302074856229
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,256,256,0.007440889047251807
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,128,16384,0.17944888273874918
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,256,51200,18.80753919813368
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,128,12288,0.13494843906826443
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,128,16384,3.782079908582899
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,128,12288,2.8370969560411243
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,128,10240,0.11262933413187663
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,256,65536,24.083816528320312
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,128,10240,2.3664417266845703
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,128,8192,0.09380710787243313
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,128,8192,1.8979555765787761
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,128,51200,11.806209140353731
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,128,7168,0.08522933059268528
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,128,7168,1.6612124972873266
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,128,65536,15.101382785373263
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,128,6144,0.07071555323070951
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,128,6144,1.4260009129842122
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,128,16384,5.503361596001519
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,128,5120,0.0612915555636088
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,128,5120,1.1924515830145943
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,128,12288,4.1394907633463545
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,128,4096,0.05228711167971293
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,128,5120,1.7378062142266169
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,128,4096,0.9560115602281359
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,128,3584,0.04399199949370491
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,128,3584,0.8380888832939996
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,128,4096,1.3949289321899414
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,128,3072,0.038754665189319186
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,128,10240,3.447574191623264
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,128,3584,1.2245324452718098
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,128,3072,0.7210595342848035
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,128,2560,0.03359199894799127
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,128,2560,0.6029609044392904
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,128,2048,0.027652444110976324
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,128,3072,1.0515261756049263
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,128,2560,0.880982240041097
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,128,1536,0.021419554948806763
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,128,2048,0.48543998930189347
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,128,1536,0.36671998765733504
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,128,1024,0.009992889232105678
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,128,2048,0.7103093465169271
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,128,1024,0.24905154440138075
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,128,1536,0.5389448801676432
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,128,768,0.008384889198674096
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,128,1024,0.36551909976535374
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,128,512,0.006931555353932911
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,128,768,0.18907199965582955
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,128,768,0.2799733214908176
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,128,256,0.005559111220969095
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,128,512,0.1238302257325914
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,128,8192,2.7629040612114797
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,128,128,0.00489688871635331
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,128,256,0.06245155466927422
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,128,256,0.10008622540367974
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,128,64,0.004987555659479565
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,128,128,0.034324444002575345
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,128,32,0.0052533331844541765
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,128,64,0.024060444699393377
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,128,32,0.02027555637889438
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,64,65536,0.644794676038954
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,128,512,0.18600000275505912
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,64,51200,0.49712175793117946
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,64,16384,0.16728444894154867
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,128,7168,2.4236053890652127
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,64,12288,0.12456533643934463
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,128,6144,2.078425725301107
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,64,10240,0.10291110806994969
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,64,16384,3.760933346218533
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,64,12288,2.8264329698350696
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,64,8192,0.0869671106338501
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,64,7168,0.0736666652891371
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,64,10240,2.3578328026665583
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,128,51200,18.597630818684895
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,64,6144,0.06448977523379855
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,64,5120,0.05448444353209602
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,64,8192,1.8912826114230687
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,64,7168,1.654591984219021
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,64,4096,0.045296000109778516
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,64,3584,0.03916177815861172
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,64,5120,1.1860568788316515
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,64,3072,0.03469244307941861
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,64,6144,1.422512902153863
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,64,3584,0.8344968689812554
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,64,2560,0.029151999288135107
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,64,2048,0.024323556158277724
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,64,3072,0.7175288730197482
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,64,1536,0.01423733267519209
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,64,2048,0.4831662178039551
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,64,2560,0.6004320250617133
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,64,1024,0.008436444732877944
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,64,1536,0.3645484447479248
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,64,1024,0.24656711684332955
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,64,768,0.007273777491516537
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,64,512,0.006242666807439592
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,64,4096,0.9508853488498263
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,64,256,0.005088888936572605
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,64,768,0.18726489279005262
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,64,512,0.12219733662075466
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,64,128,0.004179555508825514
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,64,64,0.0041759999261962045
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,64,256,0.06116444534725613
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,64,128,0.03252089023590088
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,64,32,0.004880889008442561
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,64,64,0.022638221581776936
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,64,32,0.019215111931165058
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,128,65536,23.840262518988713
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,32,65536,0.7292515436808268
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,32,51200,0.562186665005154
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,32,16384,0.1708142227596707
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,32,12288,0.12780088848537868
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,32,10240,0.1083422236972385
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,64,51200,11.767489115397135
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,32,8192,0.09665689203474258
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,32,10240,2.359988530476888
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,32,12288,2.823229259914822
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,32,7168,0.07777066363228692
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,32,6144,0.06689333253436618
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,32,16384,3.762609693739149
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,32,8192,1.893472883436415
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,32,5120,0.0560471084382799
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,32,4096,0.04660800099372864
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,64,65536,15.038665771484375
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,32,3584,0.04059200154410468
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,32,6144,1.422421349419488
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,32,3072,0.0366559988922543
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,32,7168,1.654317326015896
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,32,4096,0.9518604278564453
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,32,2560,0.030782222747802734
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,32,2048,0.024857777688238356
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,32,5120,1.187787585788303
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,32,1536,0.013730666703648038
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,32,3584,0.8365022341410319
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,32,1024,0.008002666963471307
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,32,3072,0.7204026646084256
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,32,2048,0.4843031035529242
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,32,1536,0.3676062160068088
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,32,1024,0.24937333001030815
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,32,768,0.006743999818960826
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,32,512,0.00554933316177792
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,32,256,0.004249777644872665
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,32,128,0.0038497779104444715
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,32,512,0.12422045071919759
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,32,768,0.1886604494518704
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,32,128,0.03253600001335144
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,32,64,0.0035128887328836652
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32768,32,32,0.0032248888164758682
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,32,64,0.023688889212078516
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,32,32,0.0192586663696501
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,32,2560,0.601069344414605
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,32,256,0.06105599800745646
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32768,128,128,0.058654222223493785
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,32,51200,11.754294501410591
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32768,32,65536,15.035786946614584
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,65536,16384,20.589767456054688
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,65536,12288,18.422941419813366
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,65536,16384,30.2227783203125
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,65536,10240,16.188891940646702
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,65536,12288,32.02792019314236
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,65536,12288,23.04561699761285
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,65536,16384,44.462073432074654
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,65536,8192,11.342073228624132
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,65536,7168,8.944096035427517
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,65536,10240,20.027391221788196
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,65536,8192,15.188418918185763
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,65536,10240,26.605066935221355
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,65536,8192,22.316326565212673
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,65536,51200,69.66499837239583
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,65536,6144,8.395589192708334
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,65536,7168,13.334255642361112
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,65536,6144,12.964870876736112
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,65536,5120,8.007571750217014
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,65536,5120,8.481944613986546
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,65536,7168,18.309968736436634
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,65536,6144,10.932414584689669
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,65536,4096,5.505596584743923
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,65536,5120,8.235489739312067
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,65536,3584,4.85659662882487
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,65536,4096,6.176578521728516
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,65536,3584,5.171018812391493
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,65536,4096,6.1561838785807295
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,65536,3584,5.239164564344618
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,65536,3072,4.527624766031901
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,65536,3072,4.282959832085504
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,65536,2560,3.67536629570855
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,65536,3072,4.634973314073351
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,65536,2560,3.6244578891330295
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,65536,2560,3.7594256930881076
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,65536,1536,2.236144807603624
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,65536,2048,2.9668434990776906
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,65536,1536,2.2813892364501953
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,65536,2048,2.9957474602593313
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,65536,2048,3.042788399590386
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,65536,1024,1.4590373569064672
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,65536,1024,1.651245329115126
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,65536,768,1.0906569163004558
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,65536,1536,2.4012889862060547
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,65536,512,0.7796746889750162
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,65536,768,1.278273794386122
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,65536,1024,1.7195528878106012
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,65536,768,1.3848586612277562
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,65536,512,1.0645457373725045
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,65536,256,0.7690729035271539
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,65536,512,1.1861688825819228
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,65536,128,0.4489742385016547
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,65536,256,0.9161181979709201
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,65536,64,0.35269422001308864
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,65536,256,0.7552497651841906
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,65536,32,0.36106310950385195
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,65536,128,0.8712613317701551
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,65536,64,0.894044452243381
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,65536,32,0.9937075508965386
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,65536,128,0.5709946420457628
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,65536,51200,133.41334364149307
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,51200,51200,51.676862928602425
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,51200,16384,19.222305297851562
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,65536,51200,99.30876329210069
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,51200,65536,66.46683756510417
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,51200,12288,14.290964762369791
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,51200,16384,25.05426534016927
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,51200,16384,35.05305650499132
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,51200,12288,25.344777425130207
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,51200,12288,18.73074679904514
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,51200,10240,10.587452358669704
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,51200,8192,9.436854892306858
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,51200,51200,104.98255072699652
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,51200,10240,15.134246826171875
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,51200,65536,102.21707492404515
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,51200,10240,21.069056193033855
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,51200,8192,17.852001614040798
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,51200,7168,7.701276991102431
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,51200,6144,6.500272962782119
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,51200,8192,12.124077690972221
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,51200,7168,10.498152838812933
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,51200,5120,4.891639285617404
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,51200,7168,14.486065334743925
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,51200,6144,9.74699232313368
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,51200,6144,8.678799947102865
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,51200,5120,6.757234785291884
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,51200,4096,4.272248162163629
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,51200,5120,6.490659501817491
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,51200,3584,3.907258775499132
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,51200,4096,4.97670661078559
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,51200,3584,4.196985032823351
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,51200,4096,5.007345835367839
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,51200,3584,4.208821190728082
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,51200,2560,2.721547656589084
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,51200,3072,3.3575653500027127
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,51200,3072,3.4527138604058156
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,51200,2560,2.9183972676595054
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,51200,3072,3.6355493333604603
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,51200,2048,2.1996434529622397
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,51200,2560,3.079527960883247
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,51200,2048,2.3379910786946616
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,51200,1536,1.7851422627766926
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,51200,1536,1.7976364559597438
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,51200,2048,2.5472844441731772
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,51200,1024,1.272505760192871
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,51200,768,0.8399430910746256
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,51200,1024,1.3238870832655165
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,51200,768,1.0330372916327584
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,51200,512,0.6746995713975695
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,51200,512,0.8300008773803711
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,51200,256,0.6216008928087022
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,51200,768,1.1284222073025174
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,51200,512,0.832698663075765
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,51200,128,0.34908800654941136
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,51200,256,0.7218435605367025
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,51200,1024,1.470563570658366
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,51200,256,0.6421999931335449
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,51200,64,0.2697697745429145
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,51200,128,0.4758835368686252
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,51200,32,0.29028712378607857
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,51200,128,0.6850888994004992
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,51200,64,0.6931226518419055
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,51200,32,0.7852737638685438
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,51200,1536,1.8924942016601562
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,51200,65536,144.51932779947916
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,16384,16384,5.702175140380859
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,16384,51200,16.18707444932726
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,16384,65536,20.54387749565972
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,51200,51200,78.93437364366319
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,16384,12288,4.1483438279893665
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,16384,16384,9.046695285373264
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,16384,16384,12.50103505452474
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,16384,10240,3.9059359232584634
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,16384,51200,29.970231797960068
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,16384,12288,6.830196380615234
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,16384,12288,9.002371893988714
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,16384,10240,7.551946851942275
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,16384,8192,3.139114591810438
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,16384,10240,5.622090657552083
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,16384,7168,2.428275638156467
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,16384,51200,37.5941162109375
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,16384,8192,6.242388407389323
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,16384,6144,2.0923635694715714
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,16384,8192,4.766081915961371
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,16384,65536,38.37037489149306
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,16384,7168,3.8871536254882812
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,16384,7168,5.21293682522244
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,16384,5120,1.6694648530748155
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,16384,6144,3.3860479990641275
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,16384,4096,1.347564485337999
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,16384,6144,3.7502318488227
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,16384,5120,2.467663023206923
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,16384,3584,1.2947911156548393
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,16384,5120,2.5436479780409074
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,16384,4096,1.9082152048746746
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,16384,3584,1.5483706792195637
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,16384,3072,1.114524417453342
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,16384,4096,1.9670569101969402
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,16384,3584,1.741896841261122
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,16384,2560,0.8484613100687662
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,16384,2048,0.7091351085238986
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,16384,3072,1.3293253580729167
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,16384,3072,1.4148071077134874
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,16384,2560,1.0978506935967338
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,16384,2048,0.9199519687228732
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,16384,1536,0.5991315311855739
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,16384,1024,0.3727315531836615
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,16384,2560,1.2599706649780273
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,16384,2048,1.0860569212171767
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,16384,1536,0.6902586619059244
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,16384,1024,0.5044266912672255
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,16384,768,0.29016976886325413
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,16384,1536,0.7668382326761881
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,16384,512,0.21589244736565483
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,16384,768,0.39716532495286727
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,16384,256,0.1471831136279636
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,16384,768,0.4352275530497233
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,16384,512,0.3037750985887316
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,16384,128,0.1166799995634291
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,16384,512,0.4925857649909125
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,16384,1024,0.8006746504041883
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,16384,64,0.09692266914579604
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,16384,256,0.2373510996500651
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,16384,256,0.3070026768578423
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,16384,128,0.23573954900105795
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,16384,128,0.17159110969967314
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,16384,32,0.09525333510504828
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,16384,32,0.26443200641208225
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,16384,64,0.24953778584798178
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,12288,16384,4.168029361300998
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,16384,65536,51.67005411783854
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,12288,51200,12.348518371582031
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,12288,16384,7.437127855088975
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,12288,16384,9.697241041395399
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,12288,12288,3.1851634979248047
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,12288,65536,17.440377129448784
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,12288,10240,2.787164476182726
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,12288,12288,7.081862979465061
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,12288,12288,5.628174251980251
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,12288,8192,2.261702219645182
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,12288,10240,5.862294091118707
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,12288,10240,4.632353040907118
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,12288,8192,3.8722025553385415
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,12288,7168,1.9563075171576605
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,12288,51200,24.021397908528645
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,12288,8192,3.7678167555067272
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,12288,6144,1.7769076029459636
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,12288,7168,3.2688977983262806
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,12288,7168,2.9537262386745877
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,12288,6144,2.18523195054796
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,12288,5120,1.5850409401787653
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,12288,4096,0.9763707054985894
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,12288,6144,2.7257200876871743
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,12288,5120,1.7626302507188585
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,12288,51200,29.4801262749566
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,12288,5120,2.1138025919596353
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,12288,3584,0.9672524134318033
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,12288,4096,1.4231199688381617
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,12288,3072,0.7617866728040906
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,12288,4096,1.5830258263481989
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,12288,3584,1.2205502192179363
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,12288,3584,1.4014808866712782
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,12288,2560,0.6805546548631457
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,12288,3072,1.2162319819132488
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,12288,2560,0.8993377685546875
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,12288,3072,1.3851404190063477
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,12288,2048,0.5261351267496744
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,12288,2560,0.9963164859347873
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,12288,1536,0.37021422386169434
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,12288,1024,0.27666934331258136
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,12288,2048,0.8848417599995931
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,12288,1536,0.5654275682237413
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,12288,2048,0.8275653521219889
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,12288,768,0.20925245020124647
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,12288,1024,0.4713199933369954
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,12288,1536,0.8215600119696723
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,12288,512,0.15163289176093206
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,12288,768,0.30823644002278644
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,12288,65536,31.965830485026043
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,12288,1024,0.5025413301255968
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,12288,256,0.1091102229224311
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,12288,768,0.35544710689120823
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,12288,512,0.2547822263505724
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,12288,128,0.08289955721961127
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,12288,64,0.0696915586789449
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,12288,256,0.19904088973999023
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,12288,512,0.3309760093688965
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,12288,128,0.17814221647050646
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,12288,128,0.14112888442145452
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,12288,32,0.07263733281029595
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,12288,256,0.28968000411987305
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,12288,64,0.17372088962131074
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,12288,32,0.1976026693979899
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,10240,16384,3.4419093661838107
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,12288,65536,40.24683295355903
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,10240,51200,10.638263278537327
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,10240,12288,2.7016968197292752
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,10240,16384,8.490582784016928
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,10240,16384,6.7014863755967875
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,10240,65536,14.711820814344618
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,10240,10240,2.418421427408854
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,10240,10240,4.521673838297526
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,10240,12288,5.0250977410210504
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,10240,12288,6.0417234632704
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,10240,10240,4.124353620741102
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,10240,8192,2.213738759358724
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,10240,8192,2.659627490573459
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,10240,51200,20.979229397243923
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,10240,7168,1.4941191143459742
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,10240,8192,3.4215395185682507
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,10240,6144,1.3859351476033528
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,10240,7168,2.2797484927707248
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,10240,6144,1.8819590674506292
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,10240,5120,1.0935760074191623
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,10240,7168,2.8791173299153647
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,10240,5120,1.5579653845893011
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,10240,4096,0.898564444647895
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,10240,6144,2.508212407430013
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,10240,51200,25.773515489366318
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,10240,4096,1.2473182678222656
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,10240,3584,0.7548720041910807
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,10240,5120,1.9111111958821614
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,10240,3072,0.5884133444892036
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,10240,3584,1.116644435458713
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,10240,4096,1.4707217746310766
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,10240,3584,1.2610613505045574
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,10240,2560,0.5221706496344672
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,10240,3072,1.025949372185601
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,10240,3072,1.0788311428493924
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,10240,2048,0.4303573237525092
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,10240,2560,0.8037039968702527
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,10240,1536,0.3263102107577854
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,10240,2560,0.9200337727864584
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,10240,1024,0.22420001029968262
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,10240,2048,0.7430711322360568
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,10240,2048,0.7351608806186252
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,10240,1536,0.5805822478400336
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,10240,768,0.1797919935650296
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,10240,65536,27.559855143229168
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,10240,1024,0.3627271122402615
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,10240,512,0.13027732902103
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,10240,768,0.27189956771002877
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,10240,256,0.101656887266371
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,10240,1024,0.5135173267788357
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,10240,768,0.31863199339972603
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,10240,512,0.24078665839301217
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,10240,512,0.24615822898017037
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,10240,256,0.17139644092983672
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,10240,256,0.20070132944318983
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,10240,64,0.07166666454739042
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,10240,128,0.1523324383629693
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,10240,128,0.121960891617669
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,10240,32,0.07414399915271334
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,10240,64,0.14827911059061685
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,10240,32,0.16008888350592718
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,10240,1536,0.6075013478597006
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,10240,128,0.08913333548439874
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,8192,16384,2.739530563354492
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,10240,65536,35.19777086046007
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,8192,51200,9.340159098307291
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,8192,65536,10.248908996582031
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,8192,16384,6.711051517062717
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,8192,12288,2.0513057708740234
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,8192,16384,5.2796202765570746
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,8192,10240,1.8208560943603516
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,8192,12288,4.153081681993273
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,8192,10240,2.8950896792941623
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,8192,12288,3.9788559807671438
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,8192,8192,1.5602009031507704
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,8192,10240,3.1862381829155813
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,8192,8192,2.1711226569281683
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,8192,7168,1.2866231070624459
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,8192,8192,2.4866551293267145
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,8192,51200,16.791580200195312
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,8192,6144,1.1316471099853516
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,8192,7168,1.9029066297743056
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,8192,6144,1.6263821919759114
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,8192,7168,2.1624266306559243
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,8192,5120,0.9542755550808377
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,8192,6144,1.8506861792670355
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,8192,4096,0.753769768608941
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,8192,51200,19.93835279676649
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,8192,5120,1.3614408704969618
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,8192,5120,1.5501591364542644
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,8192,3584,0.5961066881815592
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,8192,4096,1.087023099263509
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,8192,3072,0.5570000012715658
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,8192,3584,0.9563973744710287
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,8192,4096,1.5037946701049805
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,8192,2560,0.38210132386949325
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,8192,3584,1.1070133845011394
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,8192,3072,0.8253315819634331
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,8192,2048,0.3245448801252577
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,8192,65536,21.422826131184895
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,8192,1536,0.24974844190809461
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,8192,2048,0.5700462129380968
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,8192,2560,0.813610659705268
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,8192,3072,1.0501609378390842
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,8192,2048,0.6660835478040907
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,8192,1024,0.18409866756863066
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,8192,1536,0.4456133312649197
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,8192,768,0.14047911432054308
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,8192,1024,0.3101244502597385
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,8192,512,0.10711733500162761
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,8192,1024,0.36659910943773055
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,8192,768,0.23727554745144316
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,8192,1536,0.5585546493530273
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,8192,768,0.2885119915008545
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,8192,256,0.06782755586836073
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,8192,128,0.057096891933017306
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,8192,512,0.181259552637736
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,8192,256,0.1524897813796997
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,8192,64,0.04723555511898465
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,8192,256,0.148982220225864
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,8192,2560,0.6980497572157117
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,8192,512,0.2629777855343289
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,8192,32,0.049301332897610135
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,8192,128,0.10702755716111924
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,8192,128,0.12707200315263537
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,8192,64,0.12422577540079753
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,8192,32,0.12695022424062094
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,7168,16384,2.3026453653971353
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,8192,65536,28.951416015625
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,7168,51200,7.368116590711806
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,7168,16384,5.45977062649197
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,7168,12288,1.7570977740817602
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,7168,65536,10.16805945502387
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,7168,16384,5.016310373942058
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,7168,12288,3.358005311754015
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,7168,10240,1.6196888817681208
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,7168,8192,1.2816044489542644
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,7168,12288,3.627460479736328
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,7168,10240,2.605921851264106
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,7168,7168,1.0942470762464735
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,7168,10240,2.9410400390625
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,7168,8192,2.0207706027560763
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,7168,8192,2.3172675238715277
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,7168,6144,0.790462228986952
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,7168,51200,15.661732991536459
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,7168,7168,1.768853293524848
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,7168,7168,2.0280187394883895
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,7168,51200,16.64691162109375
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,7168,6144,1.4996621873643663
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,7168,5120,0.7263813548617892
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,7168,4096,0.5598604414198134
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,7168,6144,1.7532559500800238
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,7168,5120,1.2621599833170574
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,7168,4096,1.0037938223944771
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,7168,3584,0.5805466439988878
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,7168,5120,1.4671430587768555
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,7168,3072,0.4339786635504828
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,7168,4096,1.2339359919230144
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,7168,3584,0.8895742628309461
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,7168,2560,0.3921911186642117
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,7168,3584,1.0471341874864366
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,7168,3072,1.0563493304782443
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,7168,3072,0.9109253353542752
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,7168,2048,0.334807104534573
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,7168,2560,0.648898654513889
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,7168,1536,0.23589245478312174
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,7168,2560,0.7698399755689832
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,7168,2048,0.5316720008850098
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,7168,1024,0.15607999430762395
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,7168,768,0.1195253398683336
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,7168,1536,0.5364942020840114
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,7168,2048,0.6380373107062446
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,7168,1536,0.4855946434868707
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,7168,1024,0.2877884440951877
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,7168,512,0.09574577543470596
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,7168,1024,0.3423253430260553
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,7168,256,0.06781511174307929
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,7168,768,0.2685555617014567
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,7168,512,0.16622222794426814
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,7168,768,0.2776257726881239
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,7168,512,0.20154221852620444
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,7168,256,0.13119733333587646
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,7168,256,0.13799466027153864
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,7168,128,0.06855911016464233
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,7168,64,0.04665689004792107
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,7168,32,0.05442488855785794
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,7168,128,0.10042222340901692
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,7168,128,0.11397688918643528
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,7168,64,0.10914044247733222
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,7168,32,0.10948622226715088
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,7168,65536,19.992557101779514
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,6144,16384,2.230534235636393
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,7168,65536,25.56555684407552
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,6144,51200,6.2467600504557295
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,6144,12288,1.8264817131890192
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,6144,65536,8.723689609103733
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,6144,16384,4.520644293891059
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,6144,16384,4.499739752875434
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,6144,10240,1.652712927924262
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,6144,12288,2.852977752685547
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,6144,10240,2.334416071573893
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,6144,12288,3.2950123680962453
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,6144,8192,1.1789467069837782
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,6144,7168,0.9963013331095377
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,6144,10240,2.7372676001654734
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,6144,8192,1.8488453759087458
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,6144,8192,2.177276399400499
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,6144,6144,0.8248231146070691
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,6144,51200,14.930050320095487
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,6144,7168,1.6259102291531031
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,6144,51200,14.508292304144966
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,6144,5120,0.6428497632344564
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,6144,7168,1.9136390686035156
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,6144,6144,1.3871502346462672
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,6144,4096,0.5819546911451552
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,6144,5120,1.16593689388699
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,6144,4096,0.9310248692830404
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,6144,3584,0.46974579493204754
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,6144,6144,1.6787956025865343
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,6144,5120,1.3896071116129558
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,6144,4096,1.1209093729654949
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,6144,3072,0.3938675456576877
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,6144,3584,0.8200000127156576
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,6144,2560,0.3346862263149685
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,6144,3072,0.7091857592264811
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,6144,3584,0.9879902733696831
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,6144,2048,0.29564176665412056
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,6144,3072,0.8585626814100477
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,6144,2560,0.7934844228956434
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,6144,2560,0.725902239481608
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,6144,1536,0.22311555014716256
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,6144,1024,0.14524355199601915
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,6144,2048,0.4902248912387424
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,6144,1536,0.3788542217678494
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,6144,768,0.10420799917644924
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,6144,2048,0.59152799182468
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,6144,1024,0.36936532126532656
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,6144,512,0.08472800254821777
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,6144,1024,0.3210311200883654
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,6144,768,0.19882578319973418
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,6144,768,0.2485884560479058
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,6144,512,0.1616835594177246
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,6144,512,0.18657067086961535
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,6144,128,0.04547466503249275
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,6144,256,0.11753243870205349
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,6144,256,0.12594132953219944
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,6144,65536,18.547922770182293
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,6144,128,0.09393155574798584
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,6144,128,0.10082933637830947
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,6144,64,0.09567911095089382
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,6144,32,0.041160000695122614
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,6144,32,0.09600977765189277
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,6144,1536,0.4827546543545193
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,6144,256,0.05246666736072964
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,6144,64,0.0381991101635827
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,6144,65536,21.84945000542535
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,5120,16384,1.7317084206475153
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,5120,51200,5.745982276068793
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,5120,16384,3.6266309950086804
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,5120,65536,7.210573832194011
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,5120,12288,1.3586230807834203
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,5120,16384,4.187675476074219
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,5120,10240,1.1989662382337782
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,5120,12288,2.544320848253038
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,5120,10240,2.1153430938720703
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,5120,8192,0.958247078789605
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,5120,12288,3.0654631720648875
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,5120,7168,0.813994672563341
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,5120,10240,2.5468177795410156
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,5120,8192,1.691744910346137
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,5120,6144,0.5592240227593316
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,5120,8192,2.051583184136285
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,5120,7168,1.5167208777533636
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,5120,7168,1.795517391628689
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,5120,6144,1.3050915400187175
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,5120,5120,0.5357857810126411
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,5120,51200,13.139046563042534
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,5120,4096,0.48246224721272785
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,5120,6144,1.5478560129801433
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,5120,5120,1.0693244934082031
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,5120,3584,0.3806435532040066
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,5120,51200,13.389865451388888
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,5120,5120,1.3006951014200847
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,5120,4096,0.8712444305419922
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,5120,3072,0.31974487834506565
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,5120,3584,0.7527475357055664
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,5120,2560,0.2791902224222819
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,5120,4096,1.152615123324924
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,5120,3072,0.6541768709818522
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,5120,3584,0.965087996588813
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,5120,2048,0.22322132852342394
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,5120,3072,0.8584524260626899
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,5120,2048,0.45311466852823895
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,5120,2560,0.6799519856770834
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,5120,1536,0.17939555644989014
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,5120,1024,0.11995111571417914
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,5120,2048,0.6030124558342828
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,5120,1536,0.34741777843899196
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,5120,768,0.09276444382137722
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,5120,1536,0.4284631146325006
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,5120,1024,0.26906577746073407
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,5120,1024,0.31393244531419545
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,5120,512,0.06747111346986559
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,5120,256,0.05322133170233833
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,5120,768,0.18085511525472006
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,5120,768,0.23015732235378691
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,5120,512,0.13665778107113308
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,5120,512,0.17338844140370688
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,5120,128,0.037399109866884016
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,5120,65536,17.28859117296007
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,5120,256,0.1146613359451294
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,5120,256,0.10559733046425714
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,5120,64,0.03504800134234958
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,5120,128,0.08183111084832086
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,5120,2560,0.5807386504279243
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,5120,128,0.08877333005269368
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,5120,64,0.08756444189283584
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,5120,32,0.08256977796554565
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,5120,65536,16.99987962510851
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,5120,32,0.0376506679587894
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,4096,16384,1.3800631629096136
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,4096,51200,3.821356455485026
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,4096,16384,3.119130664401584
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,4096,12288,0.9124977323744031
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,4096,65536,5.329449971516927
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,4096,16384,3.820166269938151
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,4096,10240,0.9099608527289497
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,4096,12288,2.294189241197374
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,4096,8192,0.7362115648057727
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,4096,12288,2.851461410522461
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,4096,10240,1.9344204796685114
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,4096,7168,0.6109946568806967
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,4096,10240,2.383265813191732
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,4096,8192,1.5646240446302626
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,4096,8192,1.9164248572455511
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,4096,6144,0.5489164458380805
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,4096,7168,1.3846399519178603
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,4096,5120,0.4172622097863092
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,4096,7168,1.6801022423638239
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,4096,6144,1.163904931810167
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,4096,4096,0.34532888730367023
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,4096,5120,1.022121747334798
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,4096,6144,1.472007115681966
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,4096,5120,1.2153316073947482
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,4096,3584,0.27649421162075466
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,4096,51200,11.975943671332466
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,4096,3072,0.23883467250400117
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,4096,4096,0.8113742404513888
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,4096,3584,0.6886364618937174
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,4096,4096,0.9822497897677951
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,4096,51200,12.217655605740019
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,4096,2560,0.20769333839416504
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,4096,3584,0.8984781901041666
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,4096,3072,0.6697262128194174
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,4096,2048,0.19017244709862602
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,4096,3072,0.7543955379062228
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,4096,2560,0.5025919808281792
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,4096,1536,0.14254489209916857
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,4096,1024,0.09123644563886855
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,4096,2048,0.41183288892110187
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,4096,2560,0.6337573263380263
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,4096,1536,0.3157342274983724
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,4096,768,0.07473866807089911
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,4096,2048,0.5222844547695583
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,4096,1536,0.3989288806915283
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,4096,1024,0.261790222591824
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,4096,1024,0.27667466799418133
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,4096,768,0.16239733166164821
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,4096,256,0.03631555702951219
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,4096,768,0.2117475536134508
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,4096,512,0.1210977766248915
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,4096,128,0.030265778303146362
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,4096,512,0.17392533355289033
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,4096,256,0.10348444514804417
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,4096,256,0.09099288781483968
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,4096,64,0.028488000233968098
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,4096,32,0.026370666093296472
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,4096,128,0.07307822174496122
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,4096,128,0.07534666856129964
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,4096,65536,14.405788845486112
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,4096,64,0.06911110877990723
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,4096,32,0.06896889209747314
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,4096,512,0.049419555399152965
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,4096,65536,15.537284003363716
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,3584,16384,1.4289617538452148
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,3584,51200,4.542302025689019
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,3584,16384,2.9286552005343967
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,3584,65536,5.237494998508029
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,3584,12288,0.9829048580593533
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,3584,10240,0.8488808737860786
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,3584,12288,2.1835803985595703
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,3584,16384,3.6834754943847656
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,3584,8192,0.6352782249450684
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,3584,12288,2.7597512139214406
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,3584,10240,1.8514968024359808
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,3584,7168,0.5402284198337132
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,3584,8192,1.4769226710001628
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,3584,10240,2.3015609317355685
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,3584,6144,0.46685510211520725
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,3584,51200,10.061520046657986
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,3584,7168,1.3242915471394856
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,3584,5120,0.3692773448096381
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,3584,7168,1.625069300333659
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,3584,6144,1.1334408654106987
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,3584,8192,1.8556647830539281
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,3584,4096,0.32957421408759224
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,3584,6144,1.4017581939697266
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,3584,3584,0.26998400688171387
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,3584,5120,0.957024892171224
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,3584,4096,0.7433795399136014
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,3584,5120,1.174939579433865
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,3584,3072,0.23430932892693412
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,3584,4096,0.9869546890258789
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,3584,51200,11.572469923231337
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,3584,3584,0.6641208860609267
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,3584,2560,0.21159644921620688
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,3584,3584,0.8403742048475477
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,3584,3072,0.5665751033359104
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,3584,2048,0.16434133052825928
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,3584,1536,0.12529688411288792
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,3584,2560,0.47939380009969074
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,3584,3072,0.7320764329698352
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,3584,2560,0.6148204273647732
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,3584,2048,0.3904595639970567
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,3584,1024,0.08813244766659206
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,3584,2048,0.49910132090250653
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,3584,1536,0.319392893049452
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,3584,768,0.06798933611975776
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,3584,512,0.05000088943375481
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,3584,1024,0.2059048944049411
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,3584,1024,0.26538578669230145
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,3584,768,0.15308711263868544
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,3584,1536,0.3848959869808621
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,3584,256,0.033089776833852134
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,3584,768,0.20841599835289848
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,3584,128,0.029968000120586816
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,3584,65536,14.296744452582466
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,3584,512,0.11381867196824814
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,3584,512,0.15048800574408636
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,3584,256,0.09834577639897664
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,3584,256,0.08341511090596516
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,3584,32,0.026986666851573523
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,3584,64,0.02995022137959798
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,3584,128,0.06880178054173787
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,3584,128,0.06950133376651339
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,3584,64,0.0625857777065701
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,3584,32,0.060601777500576444
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,3584,65536,14.911683824327257
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,3072,16384,1.0546888775295682
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,3072,51200,3.3827991485595703
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,3072,16384,2.790312872992622
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,3072,12288,0.8241235415140787
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,3072,65536,4.54532708062066
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,3072,16384,3.5229494306776257
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,3072,10240,0.6337297757466634
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,3072,12288,2.0797661675347223
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,3072,8192,0.45043468475341797
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,3072,10240,1.7415786319308812
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,3072,12288,2.6543074713812933
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,3072,10240,2.2194319831000433
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,3072,7168,0.4347555637359619
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,3072,8192,1.403657807244195
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,3072,6144,0.3321146700117323
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,3072,8192,1.780686272515191
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,3072,7168,1.2249084048800998
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,3072,5120,0.3340906567043728
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,3072,7168,1.5799822277492945
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,3072,6144,1.068460464477539
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,3072,4096,0.22072177463107637
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,3072,51200,10.054373847113714
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,3072,6144,1.3477768368191188
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,3072,5120,0.9732809066772461
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,3072,3584,0.22224977281358507
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,3072,5120,1.133917384677463
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,3072,4096,0.7178506851196289
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,3072,3072,0.1958622270160251
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,3072,3584,0.6222453117370605
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,3072,4096,0.9220061832004123
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,3072,2560,0.16938489013248018
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,3072,3584,0.824393802218967
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,3072,3072,0.5369555685255263
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,3072,2048,0.13531111346350774
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,3072,51200,11.087066650390625
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,3072,2560,0.45393864313761395
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,3072,3072,0.7115431361728244
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,3072,1536,0.10131911436716716
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,3072,2048,0.36860889858669704
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,3072,2560,0.6062106556362575
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,3072,65536,11.733308580186632
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,3072,1024,0.07354933023452759
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,3072,768,0.057987557517157666
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,3072,2048,0.4793990982903375
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,3072,1536,0.3683191140492757
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,3072,1024,0.19525510734981963
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,3072,512,0.043206221527523465
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,3072,1024,0.2534444332122803
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,3072,768,0.14396266142527261
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,3072,256,0.028844445943832397
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,3072,512,0.1056835585170322
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,3072,768,0.19407288233439127
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,3072,512,0.14288000265757242
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,3072,256,0.07620977693133883
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,3072,128,0.023919999599456787
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,3072,256,0.09244000249438816
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,3072,64,0.020668443706300523
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,3072,32,0.021288888321982488
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,3072,128,0.06442044178644817
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,3072,128,0.06265422370698717
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,3072,64,0.05567555295096504
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,3072,32,0.05391110976537069
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,3072,1536,0.28358401192559135
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,3072,65536,14.237657335069445
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,2560,16384,0.8302551375495063
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,2560,51200,2.9571102990044484
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,2560,65536,3.6871367560492625
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,2560,12288,0.6936622195773654
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,2560,16384,2.621950149536133
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,2560,10240,0.5578568776448568
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,2560,12288,1.9626276228162978
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,2560,16384,3.399690628051758
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,2560,8192,0.4416951073540582
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,2560,12288,2.5602071550157333
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,2560,10240,1.661219596862793
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,2560,7168,0.38393510712517637
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,2560,8192,1.335468398200141
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,2560,10240,2.1408329010009766
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,2560,6144,0.31223376592000324
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,2560,8192,1.7189359664916992
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,2560,7168,1.1899048487345378
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,2560,51200,8.85330115424262
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,2560,5120,0.2593795458475749
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,2560,6144,1.0028257369995117
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,2560,7168,1.5110684500800238
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,2560,4096,0.2239840030670166
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,2560,6144,1.299642668830024
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,2560,3584,0.19162400563557944
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,2560,5120,0.834927135043674
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,2560,4096,0.6689466900295682
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,2560,3072,0.17446577548980713
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,2560,5120,1.133548418680827
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,2560,4096,0.9001280466715494
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,2560,2560,0.1365235514110989
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,2560,3584,0.7762986818949381
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,2560,3072,0.5271653069390191
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,2560,65536,11.10101318359375
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,2560,2048,0.11380444632636176
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,2560,3072,0.6722630924648709
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,2560,2560,0.43008356624179417
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,2560,1536,0.09255911244286431
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,2560,2560,0.5656648741828071
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,2560,51200,10.659972296820746
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,2560,1024,0.059966219796074756
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,2560,1536,0.2676924334632026
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,2560,2048,0.3554862340291341
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,2560,2048,0.46998755137125653
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,2560,768,0.04635555545488993
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,2560,512,0.03543466660711501
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,2560,3584,0.6045751041836208
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,2560,1024,0.18239377604590523
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,2560,1024,0.24246401256985137
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,2560,768,0.13640177249908447
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,2560,256,0.024724443753560383
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,2560,768,0.18593955039978027
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,2560,128,0.021512000097168818
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,2560,512,0.09829155604044597
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,2560,512,0.1352364487118191
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,2560,64,0.019653333557976615
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,2560,256,0.06930400265587701
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,2560,256,0.08768444591098362
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,2560,32,0.020248000820477802
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,2560,128,0.059991108046637646
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,2560,128,0.055733336342705615
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,2560,64,0.049011554982927114
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,2560,32,0.0471093323495653
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,2560,1536,0.35440977414449054
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,2048,16384,0.7184231016370984
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,2560,65536,13.627667744954428
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,2048,51200,2.3833190070258246
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,2048,65536,3.008823182847765
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,2048,12288,0.57332886589898
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,2048,16384,2.4637012481689453
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,2048,10240,0.4160346719953749
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,2048,12288,1.8531778123643663
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,2048,16384,3.2570586734347873
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,2048,12288,2.454630321926541
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,2048,8192,0.33702399995591903
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,2048,10240,1.5436951319376628
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,2048,8192,1.257941351996528
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,2048,10240,2.050811555650499
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,2048,7168,0.31644177436828613
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,2048,6144,0.25625954733954537
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,2048,51200,8.048960367838541
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,2048,8192,1.6458347108629015
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,2048,7168,1.0878417756822374
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,2048,5120,0.20218577649858263
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,2048,7168,1.4474301868014867
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,2048,6144,0.9677644305759006
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,2048,4096,0.18171466721428764
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,2048,5120,0.7833929061889648
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,2048,3584,0.1617057720820109
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,2048,6144,1.2445910771687825
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,2048,5120,1.0628275341457791
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,2048,4096,0.6308488845825195
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,2048,3072,0.12415288554297553
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,2048,4096,0.8756506707933215
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,2048,65536,10.11062706841363
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,2048,2560,0.10285955667495728
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,2048,3072,0.4791706403096517
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,2048,3584,0.7415591345893012
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,2048,2048,0.08897599909040664
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,2048,51200,10.141983879937067
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,2048,3072,0.6421706411573622
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,2048,1536,0.07246310843361749
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,2048,2560,0.5421093304951986
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,2048,2048,0.3278142346276177
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,2048,1536,0.25138666894700795
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,2048,1024,0.047535998953713306
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,2048,2048,0.4394853379991319
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,2048,768,0.03637866510285272
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,2048,1536,0.3381928867763943
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,2048,1024,0.16962756050957573
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,2048,512,0.02646044393380483
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,2048,768,0.1255964438120524
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,2048,1024,0.23055643505520293
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,2048,768,0.175291551484002
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,2048,256,0.019564444820086162
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,2048,128,0.015627556376987033
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,2048,3584,0.6012924512227377
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,2048,512,0.09024622042973836
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,2048,512,0.12731556097666422
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,2048,256,0.08166044288211398
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,2048,64,0.014690667390823364
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,2048,32,0.015332443846596612
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,2048,128,0.04919644527965122
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,2048,128,0.05554133322503832
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,2048,64,0.04213066564665901
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,2048,32,0.038909332619773015
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,2048,2560,0.404038217332628
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,2048,256,0.06273955769009061
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,1536,16384,0.4772888819376628
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,2048,65536,13.03551059299045
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,1536,51200,1.8058391147189672
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,1536,65536,2.2979208628336587
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,1536,12288,0.4394035604265001
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,1536,16384,2.3066889444986978
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,1536,12288,1.742712868584527
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,1536,10240,0.3324017789628771
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,1536,12288,2.3663999769422746
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,1536,16384,3.1450089348687063
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,1536,8192,0.2807119952307807
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,1536,10240,1.4495813581678603
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,1536,7168,0.21338400575849745
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,1536,8192,1.1655129326714408
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,1536,10240,1.978457768758138
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,1536,6144,0.20201599597930908
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,1536,8192,1.5935982598198786
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,1536,7168,1.0272319581773546
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,1536,5120,0.16715910699632433
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,1536,51200,7.359259711371528
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,1536,6144,0.8897138171725802
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,1536,7168,1.3954764472113714
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,1536,4096,0.14636622534857854
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,1536,5120,0.7441742155287
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,1536,6144,1.1990426381429036
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,1536,3584,0.11416888236999512
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,1536,4096,0.5917741987440321
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,1536,3072,0.10609155231051975
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,1536,5120,1.0044221878051758
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,1536,3584,0.51982667711046
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,1536,4096,0.8100524478488498
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,1536,2560,0.0875928865538703
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,1536,3584,0.7197350925869412
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,1536,2048,0.07586133480072021
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,1536,3072,0.449560006459554
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,1536,2560,0.3780666722191705
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,1536,1536,0.05312444435225593
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,1536,3072,0.6156551043192545
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,1536,2560,0.5183724297417535
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,1536,2048,0.30686844719780815
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,1536,65536,9.42411126030816
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,1536,1024,0.03738222188419766
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,1536,768,0.029622223642137315
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,1536,2048,0.4223733213212755
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,1536,1536,0.23334754837883842
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,1536,1024,0.1564684444003635
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,1536,1536,0.32340976927015513
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,1536,512,0.02118844456142849
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,1536,1024,0.21910222371419272
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,1536,768,0.11462488439348008
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,1536,256,0.015238222148683337
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,1536,768,0.16668889257642958
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,1536,128,0.013413333230548434
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,1536,512,0.1202195617887709
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,1536,256,0.055890666113959424
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,1536,256,0.07595111264122857
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,1536,64,0.012421333127551608
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,1536,128,0.04128088884883457
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,1536,128,0.05135022269354927
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,1536,32,0.012896888785892062
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,1536,51200,9.745967441134983
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,1536,64,0.0350888901286655
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,1536,32,0.03194488750563727
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,1536,512,0.08254755867852105
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,1024,51200,1.2500186496310763
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,1024,65536,1.4787911309136286
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,1024,16384,0.4277377658420139
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,1024,12288,0.304928011364407
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,1536,65536,12.495243496365019
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,1024,16384,2.1591199239095054
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,1024,10240,0.2310160001118978
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,1024,12288,1.6275635825263128
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,1024,16384,2.9901084899902344
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,1024,12288,2.2509689331054688
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,1024,10240,1.3605022430419922
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,1024,10240,1.8812079959445531
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,1024,8192,1.0863591300116646
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,1024,7168,0.1563484403822157
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,1024,8192,0.17696711752149794
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,1024,6144,0.13834577136569554
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,1024,8192,1.5098408593071833
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,1024,51200,6.750196244981553
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,1024,7168,0.9523839950561523
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,1024,6144,0.8207271364000109
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,1024,5120,0.11496799521976048
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,1024,4096,0.09194933043585883
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,1024,7168,1.3258213467068143
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,1024,5120,0.6852613555060493
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,1024,3584,0.07782489061355591
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,1024,4096,0.5514266755845811
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,1024,6144,1.1406195958455403
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,1024,3072,0.0691173341539171
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,1024,5120,0.9560826619466146
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,1024,4096,0.7703955438401965
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,1024,2560,0.05676266882154676
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,1024,3584,0.4843920071919759
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,1024,3072,0.41800710890028214
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,1024,3584,0.6768764389885796
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,1024,65536,8.682533264160156
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,1024,2048,0.0450817777050866
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,1024,2560,0.35132267740037704
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,1024,1536,0.03405244482888116
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,1024,3072,0.5852079921298557
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,1024,1024,0.025462221768167283
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,1024,2560,0.4917484389411078
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,1024,2048,0.28490132755703396
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,1024,768,0.02001333402262794
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,1024,1536,0.21636444992489287
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,1024,1024,0.1435262229707506
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,1024,1536,0.30647023518880206
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,1024,512,0.013903111219406128
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,1024,2048,0.40040087699890137
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,1024,1024,0.20572888851165771
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,1024,256,0.01203644441233741
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,1024,768,0.15586222542656794
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,1024,512,0.07318488756815593
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,1024,128,0.010044444766309526
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,1024,256,0.0704524450831943
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,1024,256,0.04713066750102573
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,1024,64,0.00999111102686988
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,1024,128,0.04555022385385302
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,1024,128,0.03382844395107693
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,1024,64,0.027792887555228338
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,1024,32,0.02536711096763611
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,1024,51200,9.290700276692709
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,1024,768,0.10516977972454494
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,1024,512,0.11158222622341579
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,768,65536,1.0381120045979817
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,1024,32,0.010041777458455827
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,768,16384,0.29852623409695095
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,768,51200,0.8482560051812066
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,768,12288,0.2463146580590142
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,1024,65536,11.874113294813368
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,768,16384,2.084606170654297
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,768,10240,0.16943732897440592
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,768,12288,1.589351971944173
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,768,16384,2.9478265974256725
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,768,8192,0.13609333833058676
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,768,12288,2.2152693006727433
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,768,10240,1.3093751271565754
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,768,7168,0.12746755282084146
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,768,10240,1.8512115478515625
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,768,8192,1.0476453569200304
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,768,7168,0.9248950746324328
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,768,8192,1.4854488372802734
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,768,6144,0.10775111118952434
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,768,7168,1.3044071197509766
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,768,6144,0.7896693547566732
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,768,5120,0.09094666772418553
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,768,4096,0.06890577740139432
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,768,6144,1.1239315668741863
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,768,51200,6.501243591308594
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,768,3584,0.0632986691262987
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,768,5120,0.6606613265143501
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,768,4096,0.5321475664774576
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,768,3072,0.05099733339415657
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,768,3584,0.4668320020039876
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,768,5120,0.9401404062906901
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,768,4096,0.7585422197977701
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,768,2560,0.04957688848177592
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,768,65536,8.319962395562067
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,768,3072,0.40196800231933594
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,768,3584,0.6653813256157769
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,768,2048,0.03593066665861342
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,768,2560,0.33913066652086044
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,768,1536,0.02964977754486932
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,768,3072,0.5744817521837022
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,768,1024,0.019796444310082328
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,768,2560,0.48377423816257054
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,768,2048,0.273693323135376
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,768,768,0.015384000208642749
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,768,1536,0.2086906698015001
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,768,2048,0.3916791015201145
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,768,1536,0.3000008794996473
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,768,512,0.012072000238630505
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,768,1024,0.1372737752066718
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,768,1024,0.2019066678153144
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,768,768,0.10007466872533162
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,768,768,0.15204621685875788
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,768,512,0.0694755580690172
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,768,512,0.10947999689314102
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,768,256,0.0431600014368693
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,768,64,0.01000355515215132
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,768,128,0.030488000975714788
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,768,32,0.008447111480765873
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,768,64,0.02439822256565094
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,768,32,0.02239822182390425
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,768,51200,9.157432556152344
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,768,256,0.009342222577995723
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,512,65536,0.7718470891316732
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,768,128,0.00867911097076204
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,768,256,0.068667557504442
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,768,128,0.043581333425309926
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,512,16384,0.17123288578457305
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,512,51200,0.5609271261427138
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,512,12288,0.1559528907140096
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,768,65536,11.716403537326388
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,512,16384,2.004598193698459
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,512,12288,1.5152124828762477
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,512,10240,0.11676622761620416
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,512,16384,2.8734177483452688
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,512,8192,0.09751288758383857
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,512,12288,2.1615678999159074
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,512,10240,1.2579982545640733
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,512,7168,0.08384711212582058
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,512,10240,1.8026960160997179
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,512,8192,1.0099769168429904
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,512,6144,0.070433775583903
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,512,7168,0.8851173188951281
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,512,8192,1.447946654425727
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,512,5120,0.06424711147944133
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,512,6144,0.7613315582275391
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,512,7168,1.2693324618869357
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,512,4096,0.051494220892588295
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,512,6144,1.0921555625067818
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,512,5120,0.6367991235521104
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,512,3584,0.04153955645031399
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,512,4096,0.5123253398471409
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,512,5120,0.9162123998006185
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,512,3072,0.03879288832346598
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,512,51200,6.267642550998264
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,512,3584,0.449386649661594
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,512,2560,0.03246311015552945
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,512,4096,0.7370577918158637
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,512,3072,0.3873422145843506
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,512,2048,0.025267556309700012
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,512,3584,0.6479377746582031
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,512,2560,0.3260408772362603
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,512,1536,0.019928000039524503
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,512,3072,0.5593528747558594
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,512,2560,0.4702924622429742
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,512,65536,8.003728230794271
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,512,1024,0.014478221535682678
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,512,2048,0.2634426752726237
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,512,768,0.011695110963450538
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,512,1536,0.20051466094122994
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,512,2048,0.3807724316914876
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,512,512,0.010039110978444418
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,512,1536,0.2918817732069227
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,512,1024,0.1947573290930854
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,512,1024,0.13185155391693115
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,512,768,0.1471208863788181
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,512,512,0.10534489154815674
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,512,512,0.06604533063040839
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,512,128,0.006664000037643645
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,512,256,0.03761511047681173
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,512,256,0.06355466445287068
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,512,64,0.0069644442862934535
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,512,128,0.027121777335802715
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,512,128,0.041096889310412936
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,512,32,0.007254222200976477
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,512,64,0.02127644419670105
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,512,32,0.0192586663696501
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,256,65536,0.42903910742865664
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,512,768,0.09517155753241645
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,256,51200,0.344327105416192
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,512,51200,8.942972819010416
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,256,16384,0.10833066701889038
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,512,256,0.007310222420427535
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,256,12288,0.08265955580605401
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,512,65536,11.421111212836372
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,256,16384,1.9335617489284938
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,256,10240,0.06730222039752536
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,256,12288,1.4512391620212133
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,256,10240,1.2126426696777344
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,256,16384,2.7937022315131297
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,256,8192,0.05459022190835741
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,256,12288,2.103027555677626
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,256,7168,0.05013688736491733
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,256,10240,1.7538248697916667
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,256,8192,0.9739377763536242
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,256,6144,0.042287998729281955
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,256,8192,1.4107501771714952
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,256,7168,0.8542950948079427
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,256,5120,0.035353776481416486
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,256,6144,0.7332337697347006
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,256,7168,1.2350293265448677
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,256,4096,0.03160266743765937
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,256,51200,6.028947618272569
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,256,5120,0.6138461960686578
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,256,3584,0.02626133296224806
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,256,6144,1.064889801873101
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,256,5120,0.890742195977105
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,256,3072,0.024168888727823894
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,256,4096,0.4931519826253255
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,256,3584,0.4337608814239502
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,256,4096,0.7177528805202908
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,256,2560,0.017678222722477384
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,256,65536,7.704793294270833
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,256,3584,0.6314204533894857
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,256,3072,0.37308621406555176
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,256,2048,0.014947555131382413
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,256,1536,0.011718221836619906
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,256,3072,0.5433795717027452
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,256,2560,0.31316712167527944
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,256,1024,0.009301332963837517
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,256,2048,0.2537599934471978
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,256,2560,0.45769066280788845
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,256,768,0.007948444121413762
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,256,2048,0.37001776695251465
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,256,1536,0.28296176592508954
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,256,1024,0.1269786622789171
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,256,512,0.006911110960774952
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,256,1024,0.1884382168451945
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,256,768,0.09080355697207981
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,256,256,0.005598222215970357
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,256,768,0.14221955670250788
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,256,128,0.004883555488453971
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,256,512,0.06287022431691487
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,256,512,0.10115822156270345
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,256,256,0.060031109386020236
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,256,256,0.03452444407675002
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,256,32,0.004599110947714912
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,256,128,0.038718223571777344
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,256,128,0.023992000354660883
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,256,64,0.01828533411026001
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,256,32,0.016376889414257474
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,128,65536,0.334386666615804
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,128,51200,0.25733333163791233
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,256,1536,0.19242666827307808
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,128,16384,0.0848391122288174
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,256,51200,8.68571048312717
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,256,64,0.004268444246715969
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,128,12288,0.06667644447750516
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,256,65536,11.122885810004341
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,128,12288,1.4289973576863606
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,128,16384,1.9023778703477647
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,128,10240,0.054924445019827954
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,128,16384,2.7625066969129772
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,128,8192,0.04840355449252658
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,128,10240,1.193394660949707
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,128,10240,1.7354426913791234
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,128,12288,2.078000810411241
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,128,7168,0.04064711266093784
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,128,8192,0.9581964280870227
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,128,6144,0.03482755687501695
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,128,8192,1.395584848192003
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,128,7168,0.8395573298136393
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,128,5120,0.03042222062746684
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,128,6144,0.7218862109714084
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,128,7168,1.2207715776231554
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,128,4096,0.02805244591501024
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,128,51200,5.91992908053928
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,128,5120,0.6035368707444932
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,128,6144,1.0518230862087674
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,128,3584,0.022132444712850783
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,128,5120,0.8789671262105306
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,128,4096,0.7075031068589953
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,128,3072,0.015569777952300178
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,128,3584,0.4264551003774007
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,128,3584,0.6219280030992296
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,128,2560,0.01109777804878023
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,128,65536,7.576645745171441
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,128,3072,0.3675119876861572
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,128,2048,0.008976000050703684
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,128,3072,0.5368471145629883
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,128,4096,0.4856533474392361
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,128,1536,0.00795377790927887
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,128,2560,0.3083333439297146
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,128,1024,0.006302222195598815
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,128,2048,0.2489324410756429
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,128,2560,0.4502311282687717
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,128,1536,0.1888435549206204
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,128,1024,0.12378756205240886
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,128,2048,0.3646719985538059
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,128,768,0.0058906666106647914
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,128,1536,0.2784133222368029
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,128,512,0.005199111170238919
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,128,1024,0.18472799989912245
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,128,256,0.0042204442951414315
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,128,768,0.08957155545552571
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,128,512,0.061068442132737905
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,128,128,0.003910222401221593
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,128,256,0.058054222000969775
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,128,256,0.03259733319282532
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,128,64,0.0035546666218174826
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,128,32,0.0038319999972979226
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,128,128,0.022346667117542688
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,128,64,0.01682400041156345
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,128,32,0.015491555134455362
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,64,65536,0.32291467984517414
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,64,51200,0.251672003004286
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,64,16384,0.08260622289445665
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,128,512,0.09861955377790664
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,64,12288,0.06361689170201619
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,128,51200,8.588088141547308
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,64,10240,0.053787555959489614
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,128,768,0.1391599973042806
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,128,65536,10.998917473687065
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,64,8192,0.04750755429267883
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,64,16384,1.891323513454861
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,64,7168,0.03926577832963731
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,64,6144,0.03385688861211141
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,64,12288,1.4202470779418945
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,64,5120,0.029703110456466675
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,64,10240,1.188352902730306
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,64,4096,0.02455644475089179
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,64,6144,0.7169360054863824
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,64,7168,0.8348168796963162
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,64,3584,0.021911111142900255
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,64,8192,0.9543635050455729
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,64,3072,0.013721778160995908
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,64,2560,0.009724444813198512
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,64,4096,0.48324002159966367
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,64,2048,0.00943288869327969
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,64,3584,0.4236080116695828
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,64,3072,0.36520711580912274
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,64,1536,0.00832266691658232
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,64,1024,0.006301333506902059
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,64,2048,0.24716001086764863
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,64,768,0.005610666755172942
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,64,1536,0.18695910771687826
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,64,1024,0.12203021844228108
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,64,512,0.005026666654480828
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,64,256,0.0042453333735466
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,64,768,0.0875955555174086
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,64,128,0.003552000141806073
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,64,512,0.06002489063474867
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,64,64,0.0035377778112888336
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,64,5120,0.5994835429721409
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,64,128,0.021486222743988037
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,64,32,0.00350222239891688
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,64,64,0.015863110621770222
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,64,32,0.014488000008794995
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,64,2560,0.30560443136427135
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,32,65536,0.35969866646660703
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,32,51200,0.26860178841484916
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,32,16384,0.07960266537136503
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,32,12288,0.060883555147382945
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,64,256,0.031926221317715116
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,32,10240,0.05125244458516439
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,64,51200,5.882280985514323
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,32,8192,0.045239110787709556
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,32,12288,1.4202871322631836
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,32,7168,0.03734133309788174
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,32,10240,1.1872186660766602
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,32,16384,1.8943528069390192
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,32,6144,0.03256355391608344
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,32,5120,0.028417779339684382
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,32,8192,0.9539066950480143
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,32,4096,0.025232000483406916
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,64,65536,7.526678297254775
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,32,3584,0.02446577780776554
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,32,7168,0.8349262343512641
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,32,5120,0.6001591152615017
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,32,6144,0.7186746597290039
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,32,3072,0.012425777812798819
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,32,4096,0.4827866554260254
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,32,2560,0.008960888617568547
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,32,2048,0.0076044441925154785
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,32,3584,0.42623289426167804
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,32,2560,0.3086000018649631
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,32,3072,0.3682968881395128
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,32,1536,0.006518222391605377
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,32,2048,0.2488551139831543
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,32,1024,0.005225777626037598
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,32,1024,0.12395644187927246
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,32,768,0.08880888753467137
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,32,512,0.004171555654870139
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,32,256,0.0034888887570963967
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,32,512,0.06057955821355184
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,32,256,0.031888888941870794
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,32,128,0.003145777723855443
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,32,64,0.0031519999934567344
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,32,128,0.021436444587177698
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,32,64,0.016178665889634024
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,32,32,0.013880000346236758
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,32,768,0.004886222382386525
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,32,1536,0.1892862187491523
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16384,32,32,0.003177777760558658
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,32,51200,5.876936170789931
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16384,32,65536,7.531029595269097
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,65536,16384,10.789899190266928
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,65536,12288,8.33804236518012
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16384,128,128,0.0380711125002967
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,65536,16384,13.583652072482638
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,65536,10240,6.820176018608941
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,65536,16384,19.254613240559895
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,65536,12288,10.034574720594618
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,65536,12288,11.833108690049913
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,65536,8192,5.173915439181857
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,65536,10240,8.562713623046875
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,65536,10240,8.00018056233724
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,65536,8192,6.205665588378906
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,65536,8192,6.097039964463975
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,65536,7168,4.445151011149089
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,65536,7168,4.796866522894965
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,65536,51200,32.56134033203125
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,65536,6144,4.1671324835883246
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,65536,5120,3.1654879252115884
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,65536,7168,5.029735989040799
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,65536,6144,4.3859375847710504
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,65536,6144,4.281592898898654
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,65536,5120,3.474415037367079
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,65536,4096,2.5330382453070746
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,65536,4096,2.829704920450846
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,65536,5120,3.5021288130018444
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,65536,4096,2.9666951497395835
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,65536,3584,2.4710551367865667
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,65536,3584,2.491905848185221
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,65536,3584,2.5616533491346574
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,65536,3072,2.0338107215033636
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,65536,3072,2.190371619330512
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,65536,3072,2.239264806111654
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,65536,2560,1.7006977929009333
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,65536,2560,1.7312008539835613
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,65536,2048,1.384378645155165
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,65536,2048,1.486660427517361
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,65536,1536,1.0151946809556749
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,65536,2560,1.852661344740126
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,65536,1536,1.094598240322537
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,65536,1024,0.6996915605333117
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,65536,2048,1.5193227132161458
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,65536,768,0.4859520064459906
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,65536,1024,0.8495182461208768
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,65536,1024,0.8037066459655762
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,65536,512,0.39324087566799587
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,65536,768,0.6909244325425891
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,65536,768,0.8933813307020398
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,65536,512,0.5328790876600478
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,65536,256,0.33455822202894425
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,65536,512,0.5324071248372396
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,65536,128,0.2091991106669108
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,65536,256,0.49515824847751194
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,65536,256,0.4016871187422011
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,65536,1536,1.1444062127007377
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,65536,64,0.19764533307817247
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,65536,128,0.29828355047437877
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,65536,128,0.5195040173000759
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,65536,32,0.19617422421773276
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,65536,64,0.4592862129211426
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,65536,32,0.4761981964111328
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,65536,51200,49.862263997395836
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,51200,16384,8.28804694281684
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,65536,51200,66.02853732638889
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,51200,51200,25.30373975965712
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,51200,12288,6.2631420559353295
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,51200,65536,32.103613959418404
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,51200,16384,10.965327792697481
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,51200,16384,15.06480746799045
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,51200,10240,5.216039869520399
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,51200,12288,7.815617031521267
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,51200,12288,9.85467783610026
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,51200,10240,6.775354597303603
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,51200,8192,4.574094136555989
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,51200,10240,6.46524895562066
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,51200,8192,4.572206285264757
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,51200,8192,4.709281921386719
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,51200,7168,3.4682952033148875
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,51200,7168,4.026024712456597
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,51200,7168,4.1499654981825085
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,51200,6144,3.318507512410482
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,51200,51200,52.5126478407118
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,51200,6144,3.4466834598117404
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,51200,5120,2.457572513156467
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,51200,4096,2.1638196309407554
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,51200,6144,3.561792161729601
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,51200,65536,49.876129150390625
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,51200,5120,2.7285039689805775
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,51200,5120,2.911924362182617
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,51200,4096,2.2773005167643228
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,51200,3584,2.0215494367811417
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,51200,3584,1.924197302924262
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,51200,3584,2.0333084530300565
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,51200,4096,2.3250844743516708
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,51200,3072,1.9425680372450087
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,51200,3072,1.674712922837999
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,51200,2560,1.355384932623969
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,51200,2048,1.173259523179796
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,51200,2560,1.4626373714870875
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,51200,3072,1.7879361046685114
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,51200,2560,1.4649733437432184
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,51200,2048,1.1617039574517143
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,51200,1024,0.5215484301249186
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,51200,1536,0.8850488662719727
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,51200,1536,0.9118764665391711
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,51200,1024,0.6640311347113715
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,51200,2048,1.1862701839870877
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,51200,1536,0.9302355448404948
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,51200,768,0.4386906623840332
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,51200,512,0.3038640022277832
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,51200,768,0.5184648831685384
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,51200,768,0.5246222284105089
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,51200,256,0.2839199966854519
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,51200,1024,0.7729102240668403
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,51200,512,0.44620709949069554
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,51200,128,0.2171386612786187
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,51200,512,0.5981261995103624
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,51200,256,0.3783128791385227
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,51200,256,0.34425155321757
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,51200,128,0.384735107421875
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,51200,64,0.16899466514587402
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,51200,32,0.15299199687110052
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,51200,128,0.24058845308091906
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,51200,64,0.37682223320007324
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,51200,32,0.3811004426744249
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,51200,65536,69.72144911024306
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,16384,51200,7.959031846788194
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,16384,65536,10.008227030436197
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,16384,16384,2.837711970011393
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,16384,12288,1.9247830708821614
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,16384,16384,5.4892730712890625
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,16384,16384,4.209159851074219
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,16384,51200,14.06019507514106
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,16384,12288,3.4239963955349393
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,16384,10240,1.859823015001085
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,16384,12288,3.2552142673068576
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,16384,8192,1.2779760360717773
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,16384,10240,2.359158198038737
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,16384,10240,2.5971298217773438
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,16384,51200,18.87316724989149
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,16384,8192,1.827538596259223
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,16384,7168,1.0816177792019315
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,16384,65536,17.756798638237846
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,16384,8192,1.9643431769476996
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,16384,6144,0.9524941974216037
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,16384,7168,1.5445120069715712
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,16384,6144,1.3221377266777885
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,16384,5120,0.8592737515767416
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,16384,7168,1.7169289059109156
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,16384,5120,1.127229372660319
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,16384,6144,1.383048905266656
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,16384,4096,0.621321784125434
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,16384,5120,1.1524133682250977
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,16384,3584,0.523980458577474
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,16384,4096,1.0638533698187935
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,16384,4096,0.9384533564249674
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,16384,3072,0.4897022247314453
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,16384,3584,0.7750026914808484
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,16384,3584,0.8449466493394641
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,16384,3072,0.7390640046861437
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,16384,2048,0.3140924506717258
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,16384,3072,0.6992613474527994
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,16384,2560,0.5920560095045302
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,16384,2560,0.6837395562065972
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,16384,1536,0.25200621287027997
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,16384,2048,0.450816896226671
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,16384,1536,0.34478221999274355
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,16384,1024,0.18239466349283853
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,16384,2048,0.5116906695895725
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,16384,768,0.14124622609880236
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,16384,1024,0.2517288790808784
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,16384,1536,0.38457332717047793
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,16384,1024,0.27128177218967015
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,16384,512,0.09535555707083808
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,16384,768,0.2033440007103814
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,16384,2560,0.41569243537055117
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,16384,768,0.26800444391038686
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,16384,256,0.07334666781955294
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,16384,512,0.17350310749477812
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,16384,512,0.16041599379645452
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,16384,128,0.05745244688457913
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,16384,64,0.04774844315316942
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,16384,256,0.13981333043840197
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,16384,128,0.09678400225109524
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,16384,128,0.12462045086754693
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,16384,32,0.05127822359402975
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,16384,64,0.12618577480316162
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,16384,32,0.13038133250342474
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,16384,65536,25.662355211046005
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,16384,256,0.1368053356806437
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,12288,16384,2.225876490275065
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,51200,51200,40.07478162977431
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,12288,51200,6.438321007622613
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,12288,65536,8.190979851616754
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,12288,16384,4.366604275173612
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,12288,12288,1.6742337544759114
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,12288,16384,3.361999087863498
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,12288,10240,1.606686274210612
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,12288,10240,1.9781413608127172
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,12288,12288,2.781805250379774
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,12288,12288,2.589235517713759
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,12288,8192,1.2332835727267795
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,12288,10240,2.1284684075249567
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,12288,8192,1.4752160178290472
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,12288,7168,0.9622266557481555
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,12288,8192,1.5947724448310003
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,12288,6144,0.8213173548380533
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,12288,7168,1.27637693617079
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,12288,51200,11.978314717610678
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,12288,7168,1.3987982008192275
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,12288,6144,1.0655653211805556
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,12288,5120,0.5846106741163466
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,12288,4096,0.45662842856513125
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,12288,6144,1.1601111094156902
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,12288,5120,0.9264461729261609
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,12288,5120,0.9742701848347982
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,12288,4096,0.9192507002088758
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,12288,3584,0.4330844349331326
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,12288,4096,0.8018488883972168
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,12288,3072,0.35467643207973903
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,12288,3584,0.6198088857862685
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,12288,65536,14.504457261827257
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,12288,2560,0.286497778362698
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,12288,3584,0.6874266730414497
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,12288,3072,0.6561688847011989
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,12288,2560,0.45507023069593644
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,12288,2048,0.26350400182935924
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,12288,3072,0.5974159770541722
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,12288,1536,0.17888177765740287
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,12288,2048,0.3677066697014703
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,12288,2560,0.5872142050001357
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,12288,1024,0.13359910911983913
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,12288,1536,0.314608891805013
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,12288,768,0.11635733975304498
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,12288,1024,0.2038631174299452
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,12288,1024,0.23410132196214464
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,12288,512,0.07564355267418756
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,12288,768,0.16066400210062662
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,12288,768,0.21858133210076225
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,12288,256,0.05201422174771627
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,12288,512,0.1458559963438246
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,12288,512,0.13081955909729004
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,12288,128,0.043952001465691455
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,12288,256,0.1061626672744751
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,12288,256,0.11609244346618652
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,12288,64,0.03823466764556037
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,12288,128,0.0803955528471205
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,12288,128,0.0977333320511712
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,12288,32,0.03941599859131707
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,12288,64,0.1002017789416843
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,12288,32,0.10157422224680583
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,12288,2048,0.4147840076022678
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,12288,1536,0.3813217745886908
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,12288,51200,14.648857964409721
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,12288,65536,20.11889139811198
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,10240,16384,1.7400773366292317
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,10240,51200,5.265515645345052
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,10240,16384,3.035145865546333
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,10240,16384,3.801408131917318
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,10240,65536,6.7001554701063375
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,10240,12288,1.413321812947591
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,10240,10240,1.163837326897515
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,10240,12288,2.370751063028971
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,10240,10240,1.7837005191379125
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,10240,12288,2.3011351691351996
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,10240,8192,0.8379351298014323
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,10240,10240,1.881954616970486
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,10240,7168,0.7998568746778699
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,10240,8192,1.2902453740437825
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,10240,8192,1.4445084465874567
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,10240,6144,0.6420568890041775
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,10240,7168,1.1233626471625435
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,10240,51200,9.960631476508246
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,10240,6144,0.9524186452229818
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,10240,7168,1.2616613176133897
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,10240,5120,0.5160213576422797
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,10240,4096,0.46335734261406797
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,10240,6144,1.1273991266886394
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,10240,5120,0.7904799779256185
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,10240,5120,0.8878400060865613
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,10240,3584,0.33884355756971574
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,10240,51200,12.656342400444878
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,10240,4096,0.8388089074028863
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,10240,4096,0.7128782272338867
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,10240,3072,0.2953502337137858
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,10240,3584,0.5555831061469184
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,10240,2560,0.24437244733174643
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,10240,3584,0.6472764545016819
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,10240,3072,0.48416535059611004
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,10240,2048,0.21508977148267958
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,10240,3072,0.5438222355312771
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,10240,2560,0.4055439896053738
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,10240,1536,0.15648799472384983
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,10240,2048,0.3277662330203586
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,10240,2560,0.4934870931837294
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,10240,1024,0.12063199943966335
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,10240,1536,0.24763467576768664
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,10240,1536,0.286719110276964
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,10240,768,0.09242933326297337
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,10240,512,0.06392800145679049
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,10240,1024,0.17989067236582437
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,10240,1024,0.21220178074306914
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,10240,768,0.1420560015572442
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,10240,768,0.16901777850257027
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,10240,65536,13.798444112141928
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,10240,256,0.047100444634755455
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,10240,128,0.03754399882422553
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,10240,512,0.12628444035847983
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,10240,512,0.13172622521718344
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,10240,64,0.039417776796552874
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,10240,256,0.0944675538274977
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,10240,128,0.08472977744208442
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,10240,32,0.04127555423312717
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,10240,256,0.11752800146738689
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,10240,64,0.08415377802318996
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,10240,32,0.08650577730602688
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,10240,2048,0.3724257681104872
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,10240,128,0.07192977931764391
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,10240,65536,16.71753099229601
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,8192,16384,1.3660098181830511
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,8192,51200,4.089128706190321
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,8192,65536,5.10823737250434
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,8192,16384,3.2052319844563804
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,8192,12288,1.0582062403361003
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,8192,16384,2.695506625705295
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,8192,10240,0.997372415330675
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,8192,12288,2.012055926852756
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,8192,10240,1.458440038892958
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,8192,12288,2.0222479502360025
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,8192,8192,0.751198238796658
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,8192,10240,1.6755155987209742
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,8192,8192,1.118391990661621
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,8192,7168,0.7433973418341743
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,8192,8192,1.2881057527330186
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,8192,6144,0.4920488993326823
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,8192,7168,0.9898711310492622
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,8192,7168,1.1042488945855033
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,8192,6144,0.8299742274814181
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,8192,5120,0.42462754249572754
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,8192,51200,8.669979519314236
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,8192,4096,0.3323422273000081
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,8192,5120,0.6965137587653266
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,8192,6144,0.9650586446126302
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,8192,4096,0.5901546478271484
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,8192,5120,0.7868755658467611
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,8192,3584,0.27732978926764595
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,8192,51200,10.619741651746962
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,8192,3072,0.2495288848876953
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,8192,4096,0.6753342416551379
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,8192,2560,0.21440888775719535
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,8192,3584,0.5698524581061469
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,8192,3072,0.5041306813557943
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,8192,2048,0.1670044395658705
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,8192,2560,0.3615769015418158
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,8192,1536,0.12003200583987766
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,8192,2048,0.2860293388366699
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,8192,2560,0.5207360055711534
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,8192,2048,0.3460871113671197
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,8192,1536,0.22297512160407174
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,8192,1536,0.2573973337809245
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,8192,3584,0.48678133222791886
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,8192,768,0.07500266366534762
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,8192,1024,0.19008444415198433
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,8192,512,0.05162400007247925
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,8192,3072,0.4336160024007161
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,8192,768,0.12350666522979736
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,8192,768,0.1506942245695326
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,8192,256,0.037335998482174344
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,8192,512,0.09891021913952297
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,8192,512,0.11808533138699001
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,8192,128,0.030976000759336684
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,8192,256,0.08448266983032227
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,8192,256,0.08022666639751859
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,8192,64,0.025447110335032146
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,8192,128,0.07103200091256036
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,8192,32,0.026365333133273657
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,8192,64,0.07007644573847453
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,8192,32,0.07266933388180204
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,8192,1024,0.08603911267386542
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,8192,1024,0.15785955058203802
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,8192,65536,11.767277187771269
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,8192,65536,13.977997673882378
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,8192,128,0.06364177995257907
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,7168,16384,1.2466826968722873
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,7168,51200,4.479984707302518
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,7168,65536,5.077709197998047
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,7168,16384,2.6620640224880643
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,7168,16384,2.527234607272678
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,7168,12288,1.10826661851671
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,7168,10240,0.8064124319288465
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,7168,12288,1.686764399210612
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,7168,12288,1.8480044470893011
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,7168,10240,1.3359528647528753
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,7168,8192,0.649454222785102
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,7168,10240,1.5535084406534831
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,7168,8192,1.009229342142741
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,7168,7168,0.6348622110154893
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,7168,6144,0.4928462240431044
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,7168,8192,1.2058204015096028
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,7168,7168,0.8950995339287652
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,7168,51200,8.86118910047743
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,7168,7168,1.0372195773654513
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,7168,51200,8.084713406032986
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,7168,5120,0.38748976919386124
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,7168,6144,0.7848258018493652
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,7168,4096,0.30616532431708443
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,7168,6144,0.8919920391506619
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,7168,5120,0.6531190872192383
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,7168,4096,0.5733484692043728
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,7168,3584,0.2865600056118435
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,7168,5120,0.7485395537482368
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,7168,4096,0.6101484298706055
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,7168,3584,0.4533368746439616
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,7168,3072,0.22839644220140246
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,7168,2560,0.1966266632080078
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,7168,3072,0.42985955874125165
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,7168,2048,0.15439911683400473
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,7168,3072,0.4666568968031142
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,7168,2560,0.3315822283426921
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,7168,3584,0.5368213123745388
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,7168,2560,0.40539733568827313
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,7168,1536,0.12611999776628283
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,7168,1024,0.08455200327767266
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,7168,2048,0.2729537751939562
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,7168,1536,0.20078044467502168
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,7168,65536,10.295521206325954
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,7168,1536,0.24314755863613555
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,7168,2048,0.33709332678053117
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,7168,1024,0.14352888531155056
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,7168,768,0.06924088795979817
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,7168,1024,0.17950667275322807
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,7168,512,0.05604888995488485
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,7168,256,0.040320889817343816
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,7168,128,0.030351112286249798
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,7168,768,0.11420355902777778
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,7168,512,0.1170382234785292
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,7168,512,0.09170933564503987
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,7168,256,0.07956800195905897
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,7168,256,0.07152089145448473
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,7168,64,0.026760000321600173
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,7168,32,0.026724444495307073
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,7168,128,0.05940710835986667
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,7168,64,0.06237155861324734
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,7168,32,0.06083910995059543
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,7168,768,0.15271111329396567
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,7168,65536,12.771525065104166
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,7168,128,0.0626044472058614
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,6144,16384,1.117699517144097
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,6144,51200,3.212124506632487
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,6144,16384,2.228849834865994
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,6144,65536,3.939070383707682
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,6144,12288,0.9266569349500867
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,6144,10240,0.6845582326253256
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,6144,16384,2.309671190049913
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,6144,12288,1.436215082804362
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,6144,8192,0.4359270996517605
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,6144,12288,1.7398719787597656
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,6144,10240,1.201891581217448
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,6144,10240,1.4447484546237523
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,6144,8192,0.954712020026313
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,6144,7168,0.4629208776685927
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,6144,8192,1.1270009146796334
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,6144,6144,0.4353128804100885
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,6144,7168,0.8222177823384603
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,6144,7168,0.975521829393175
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,6144,6144,0.7047235700819227
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,6144,5120,0.3043733437856038
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,6144,51200,8.055881924099392
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,6144,4096,0.25671911239624023
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,6144,6144,0.9085209104749891
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,6144,5120,0.5915804439120823
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,6144,4096,0.49664889441596133
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,6144,3584,0.23065421316358778
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,6144,4096,0.6193182203504775
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,6144,3584,0.417647123336792
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,6144,3072,0.19400621785057914
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,6144,3584,0.5196337699890137
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,6144,3072,0.36094045639038086
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,6144,2560,0.15388266245524088
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,6144,3072,0.45637067159016925
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,6144,2560,0.3051839934455024
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,6144,2048,0.13838577270507812
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,6144,5120,0.7033155759175619
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,6144,65536,9.971852620442709
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,6144,2560,0.3867057694329156
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,6144,1536,0.10692355367872451
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,6144,1024,0.07373866770002577
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,6144,2048,0.24568978945414224
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,6144,51200,7.381958855523004
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,6144,2048,0.3051564428541395
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,6144,1536,0.1964497831132677
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,6144,1536,0.23688443501790366
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,6144,768,0.056998219754960805
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,6144,512,0.04354755414856804
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,6144,1024,0.1316479974322849
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,6144,1024,0.1644373337427775
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,6144,256,0.029292444388071697
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,6144,768,0.13695022794935438
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,6144,512,0.10366577572292751
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,6144,128,0.02459999918937683
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,6144,256,0.0633466641108195
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,6144,256,0.07353244225184123
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,6144,64,0.020717332760492962
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,6144,32,0.021233777205149334
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,6144,128,0.055756443076663546
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,6144,128,0.055910223060184054
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,6144,64,0.05406399899058872
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,6144,32,0.05331200030114916
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,6144,65536,9.643420749240452
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,6144,768,0.1071431106991238
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,6144,512,0.08161777920193143
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,5120,16384,0.8507102330525717
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,5120,16384,1.8088328043619792
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,5120,51200,2.859595616658529
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,5120,65536,3.6381708780924478
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,5120,12288,0.6214506891038682
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,5120,10240,0.537451532151964
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,5120,16384,2.1399866739908853
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,5120,12288,1.3052106433444552
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,5120,8192,0.4272204505072699
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,5120,12288,1.627688937717014
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,5120,10240,1.1668151219685872
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,5120,10240,1.3399786419338648
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,5120,7168,0.3517724408043756
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,5120,8192,1.110073725382487
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,5120,6144,0.308281766043769
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,5120,51200,6.295742034912109
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,5120,7168,0.7531004481845431
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,5120,8192,1.0638186136881511
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,5120,5120,0.27948445743984646
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,5120,7168,0.9449955622355143
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,5120,6144,0.688151094648573
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,5120,4096,0.21274044778611925
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,5120,5120,0.5431564648946127
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,5120,6144,0.798191123538547
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,5120,3584,0.17355644702911377
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,5120,4096,0.4424897829691569
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,5120,5120,0.7102586428324381
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,5120,3072,0.14760533968607584
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,5120,4096,0.5509813096788194
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,5120,3584,0.38422134187486434
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,5120,3584,0.4852471351623535
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,5120,2560,0.1261377731959025
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,5120,3072,0.3359377649095323
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,5120,2048,0.10313422150082058
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,5120,65536,8.39011976453993
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,5120,2560,0.2811422348022461
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,5120,3072,0.4253235658009847
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,5120,1536,0.08150311311086018
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,5120,2048,0.2270053227742513
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,5120,1024,0.0565519995159573
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,5120,2560,0.35559466150071883
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,5120,2048,0.2816862265268962
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,5120,768,0.04849244488610161
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,5120,1536,0.21689066621992323
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,5120,512,0.03465422325664096
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,5120,1024,0.1201368835237291
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,5120,1024,0.1654284397761027
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,5120,768,0.12469244003295898
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,5120,768,0.09615821970833673
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,5120,512,0.07312977976269193
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,5120,512,0.09695288870069717
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,5120,256,0.06785421901279025
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,5120,128,0.021589333812395733
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,5120,256,0.05681155787573921
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,5120,64,0.01958933307064904
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,5120,51200,6.805922614203559
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,5120,128,0.04959555466969808
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,5120,32,0.020280889338917203
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,5120,128,0.05144800080193413
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,5120,64,0.046909332275390625
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,5120,65536,8.637674119737413
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,5120,32,0.046524445215861
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,5120,1536,0.16837422053019205
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,5120,256,0.026019554999139573
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,4096,16384,0.631989320119222
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,4096,51200,2.322697745429145
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,4096,65536,2.878886116875542
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,4096,12288,0.5557529131571451
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,4096,16384,1.5761920081244574
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,4096,16384,1.9166346655951605
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,4096,10240,0.41638578308953184
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,4096,12288,1.1718026267157662
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,4096,8192,0.3504800001780192
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,4096,12288,1.46143552992079
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,4096,10240,0.9676746792263455
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,4096,7168,0.31562754842970103
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,4096,10240,1.2245875464545357
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,4096,8192,0.8307386504279243
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,4096,6144,0.26974132325914174
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,4096,8192,0.9691964255438911
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,4096,51200,5.640781402587891
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,4096,7168,0.7108631134033203
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,4096,5120,0.218849778175354
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,4096,7168,0.8532791137695312
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,4096,4096,0.1618480020099216
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,4096,6144,0.6154301961263021
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,4096,5120,0.49537865320841473
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,4096,6144,0.7364328702290853
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,4096,3584,0.15156177679697672
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,4096,4096,0.39849244223700625
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,4096,5120,0.6733911302354602
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,4096,4096,0.5073759820726182
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,4096,3584,0.3515635596381293
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,4096,3072,0.13639911015828451
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,4096,51200,5.979538811577691
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,4096,2560,0.10832977957195705
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,4096,3584,0.44472355312771267
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,4096,2048,0.08375110891130234
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,4096,3072,0.308077335357666
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,4096,2560,0.25588178634643555
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,4096,1536,0.07019733058081733
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,4096,3072,0.387318213780721
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,4096,2048,0.20413511329227021
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,4096,2560,0.32634933789571124
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,4096,1024,0.04553777641720242
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,4096,2048,0.26463021172417533
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,4096,768,0.035754667388068304
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,4096,1536,0.15258577134874132
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,4096,768,0.08786044518152873
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,4096,1024,0.10846844646665786
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,4096,1536,0.1999466684129503
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,4096,512,0.027855998939938013
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,4096,256,0.01936533384852939
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,4096,1024,0.14329777823554143
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,4096,768,0.11555733945634629
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,4096,128,0.016200888488027785
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,4096,65536,7.7239990234375
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,4096,512,0.08984088897705078
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,4096,512,0.06599289178848267
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,4096,256,0.06240799691942003
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,4096,256,0.04970133304595947
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,4096,64,0.014454222387737699
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,4096,32,0.015209777487648858
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,4096,128,0.046675556235843234
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,4096,64,0.040095110734303795
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,4096,32,0.039023998710844256
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,4096,65536,7.514811197916667
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,3584,16384,0.6236773596869575
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,4096,128,0.04272888766394722
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,3584,51200,1.9795182545979817
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,3584,12288,0.5048817528618706
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,3584,16384,1.4873741997612848
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,3584,65536,2.9335678948296438
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,3584,10240,0.37586400243971085
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,3584,16384,1.8650336795383031
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,3584,12288,1.1287742190890842
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,3584,12288,1.4022133085462782
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,3584,8192,0.2933768961164686
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,3584,10240,1.0147342681884766
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,3584,10240,1.1749946806165907
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,3584,7168,0.25327910317314994
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,3584,8192,0.7425395647684733
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,3584,51200,4.97254392835829
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,3584,6144,0.23129510879516602
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,3584,7168,0.6519689030117458
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,3584,5120,0.18717511494954428
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,3584,7168,0.8566711213853625
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,3584,6144,0.5599866443210179
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,3584,4096,0.15997244252098933
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,3584,6144,0.823437319861518
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,3584,5120,0.47084358003404403
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,3584,3584,0.13376800219217935
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,3584,51200,5.826598273383246
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,3584,5120,0.6070213317871094
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,3584,65536,6.373984866672092
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,3584,8192,0.9620763990614148
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,3584,4096,0.37893422444661456
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,3584,3072,0.11920000447167291
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,3584,4096,0.4938257535298665
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,3584,3584,0.3360453446706136
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,3584,3072,0.2987591160668267
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,3584,2048,0.08428355720308091
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,3584,2560,0.24277244673834908
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,3584,3584,0.4343804518381755
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,3584,3072,0.3764782216813829
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,3584,1536,0.06593510839674208
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,3584,2560,0.31813422838846844
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,3584,1024,0.04477599925465054
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,3584,2048,0.19365866978963217
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,3584,1536,0.14469422234429255
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,3584,2048,0.25511111153496635
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,3584,768,0.03474044468667772
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,3584,1536,0.19318577978346083
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,3584,512,0.025839999318122864
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,3584,1024,0.10240088568793403
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,3584,1024,0.13895821571350098
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,3584,768,0.08247022496329413
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,3584,256,0.019371555911170114
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,3584,768,0.1122515598932902
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,3584,128,0.016151999433835346
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,3584,512,0.06260177824232313
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,3584,512,0.0866968896653917
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,3584,256,0.06006133556365967
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,3584,64,0.0177528891298506
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,3584,32,0.018522666560279
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,3584,65536,7.473624335394965
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,3584,128,0.044397334257761635
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,3584,64,0.036496887604395546
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,3584,2560,0.09238400061925252
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,3584,32,0.03459999958674113
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,3584,256,0.04656444324387444
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,3584,128,0.039048890272776283
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,3072,51200,1.5988515218098958
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,3072,16384,0.4913733270433214
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,3072,12288,0.40920445654127335
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,3072,65536,2.466567145453559
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,3072,16384,1.3878364562988281
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,3072,10240,0.3534426689147949
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,3072,12288,1.0662106408013237
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,3072,16384,1.7921129862467449
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,3072,8192,0.2741982142130534
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,3072,12288,1.3617661794026692
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,3072,10240,0.902680926852756
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,3072,7168,0.20913244618309867
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,3072,10240,1.1298408508300781
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,3072,8192,0.7311226526896158
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,3072,51200,4.6770854526095915
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,3072,6144,0.1973573366800944
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,3072,8192,0.9098889032999674
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,3072,7168,0.6266311009724935
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,3072,5120,0.16801067193349203
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,3072,6144,0.5333617528279623
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,3072,7168,0.8008142047458224
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,3072,4096,0.12858488824632433
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,3072,5120,0.44795020421346027
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,3072,6144,0.7042160034179688
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,3072,3584,0.1291146675745646
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,3072,5120,0.58151822619968
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,3072,65536,5.990577697753906
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,3072,4096,0.35962488916185165
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,3072,3072,0.1051795548862881
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,3072,2560,0.08072533210118611
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,3072,4096,0.47176090876261395
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,3072,3584,0.41707732942369247
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,3072,3072,0.276088900036282
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,3072,3072,0.36177865664164227
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,3072,2048,0.06901688708199395
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,3072,2560,0.23556176821390787
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,3072,1536,0.04779288834995694
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,3072,2560,0.30550400416056317
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,3072,1024,0.036962668100992836
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,3072,2048,0.18377333217196992
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,3072,2048,0.24405511220296225
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,3072,1536,0.13744710551367864
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,3072,1536,0.1851440005832248
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,3072,768,0.027066666218969557
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,3072,512,0.020635555187861126
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,3072,1024,0.09644533528221978
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,3072,1024,0.13315733273824057
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,3072,51200,5.561014387342666
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,3072,256,0.016125332978036668
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,3072,768,0.10691110955344306
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,3072,768,0.07842577828301324
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,3072,128,0.013210666676362356
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,3072,512,0.05820888943142361
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,3072,512,0.08274400234222412
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,3072,64,0.012085333466529846
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,3072,256,0.05659200085533989
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,3072,256,0.04250399933920967
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,3072,32,0.012826667063766055
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,3072,128,0.03446577654944526
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,3072,128,0.04155110981729295
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,3072,64,0.03185333477126227
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,3072,32,0.03190044562021891
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,3072,3584,0.3210551208919949
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,3072,65536,7.1233876546223955
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,2560,16384,0.41983911726209855
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,2560,51200,1.395133336385091
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,2560,16384,1.3127724329630535
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,2560,65536,1.9231609768337672
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,2560,12288,0.351398229598999
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,2560,16384,1.728748427497016
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,2560,12288,0.9888827006022135
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,2560,10240,0.29356087578667533
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,2560,12288,1.315667576260037
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,2560,8192,0.2231982284122043
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,2560,10240,0.8285155296325684
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,2560,7168,0.20497332678900826
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,2560,8192,0.6641208860609267
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,2560,10240,1.1208586162990994
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,2560,6144,0.16274933020273843
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,2560,8192,0.9219253328111437
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,2560,51200,4.331131405300565
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,2560,7168,0.5979413456386989
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,2560,5120,0.12477421760559082
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,2560,6144,0.5035715632968479
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,2560,7168,0.7684817843967013
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,2560,5120,0.42599111133151585
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,2560,4096,0.10895822445551555
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,2560,6144,0.6628773477342393
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,2560,3584,0.0924711094962226
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,2560,5120,0.5571902063157823
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,2560,3072,0.08118310901853773
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,2560,4096,0.34020445081922746
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,2560,65536,5.504443698459202
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,2560,3584,0.29950043890211314
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,2560,4096,0.4528666602240668
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,2560,2560,0.07217511203553942
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,2560,51200,5.325282626681857
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,2560,3584,0.4062986638810899
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,2560,3072,0.2591911156972249
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,2560,2048,0.05882933404710558
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,2560,1536,0.04449866546524895
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,2560,3072,0.34683911005655926
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,2560,2560,0.21756711271074083
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,2560,1024,0.029931555191675823
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,2560,2560,0.29173776838514537
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,2560,1536,0.12929511070251465
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,2560,2048,0.17140089140997994
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,2560,768,0.022300443715519373
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,2560,2048,0.23435288005405
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,2560,1536,0.17688443925645617
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,2560,512,0.017256889078352187
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,2560,1024,0.0904195573594835
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,2560,256,0.013778666655222574
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,2560,1024,0.12660266293419734
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,2560,128,0.01183111137813992
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,2560,768,0.1021804412206014
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,2560,768,0.07249510950512357
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,2560,512,0.07867999871571858
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,2560,512,0.05442488855785794
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,2560,256,0.05381866627269321
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,2560,256,0.03804088963402642
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,2560,128,0.039092444711261325
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,2560,128,0.03123289015558031
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,2560,64,0.02882400155067444
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,2560,32,0.028113779094484117
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,2560,65536,6.806470235188802
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,2048,51200,1.0332169002956815
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,2560,64,0.010579555398888059
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,2048,65536,1.4920843972100153
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,2048,16384,0.3843119939168294
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,2048,12288,0.2795395586225721
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,2560,32,0.010674667027261523
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,2048,16384,1.2388630972968209
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,2048,10240,0.21742399533589682
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,2048,12288,0.9745697445339627
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,2048,16384,1.6471946504380968
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,2048,8192,0.1786044438680013
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,2048,10240,0.7803271081712512
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,2048,12288,1.2396408716837566
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,2048,7168,0.15109511216481528
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,2048,10240,1.038305812411838
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,2048,8192,0.6269920137193468
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,2048,51200,3.9766727023654513
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,2048,6144,0.1403084463543362
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,2048,8192,0.835908465915256
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,2048,7168,0.5509884622361925
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,2048,5120,0.10859111282560562
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,2048,6144,0.47461779912312824
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,2048,7168,0.7351093292236328
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,2048,4096,0.09649422433641221
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,2048,6144,0.6337955792744955
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,2048,5120,0.39672356181674534
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,2048,65536,5.094718085394965
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,2048,3584,0.08333333333333333
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,2048,4096,0.3215502103169759
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,2048,5120,0.5333449045817057
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,2048,3072,0.07031999693976508
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,2048,2560,0.05424000157250298
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,2048,4096,0.43260622024536133
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,2048,3584,0.2827848858303494
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,2048,2048,0.04649688800175985
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,2048,3072,0.2442542182074653
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,2048,3584,0.38223910331726074
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,2048,3072,0.33065954844156903
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,2048,2560,0.2782426675160726
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,2048,2048,0.16139022509256998
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,2048,51200,5.07548353407118
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,2048,2048,0.2224968804253472
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,2048,1536,0.11933422088623047
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,2048,1536,0.16810666190253365
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,2048,768,0.019654222660594516
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,2048,1024,0.11980088551839192
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,2048,1024,0.08250844478607178
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,2048,512,0.014930667148696052
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,2048,768,0.06739555464850532
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,2048,768,0.09655021958880955
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,2048,256,0.011682666838169098
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,2048,512,0.04965777860747444
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,2048,512,0.07408266597323947
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,2048,128,0.010341333018408881
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,2048,256,0.034332444270451866
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,2048,256,0.050332443581687085
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,2048,65536,6.486440022786458
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,2048,64,0.009657777845859528
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,2048,32,0.009992000129487779
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,2048,128,0.03707911239729987
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,2048,128,0.028470221492979262
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,2048,2560,0.20841333601209852
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,2048,64,0.025733333494928148
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,2048,32,0.024744888146718342
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,2048,1024,0.02514933380815718
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,1536,51200,0.8553333282470703
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,1536,65536,1.0391537348429363
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,1536,16384,0.3102702299753825
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,2048,1536,0.03371999992264642
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,1536,12288,0.2270044485727946
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,1536,12288,0.8754871156480578
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,1536,16384,1.1866497463650174
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,1536,10240,0.1868248913023207
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,1536,16384,1.5983528561062281
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,1536,12288,1.232506646050347
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,1536,10240,0.7319164276123047
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,1536,8192,0.1365440024269952
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,1536,7168,0.11585777335696751
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,1536,10240,1.0113351609971788
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,1536,8192,0.5867830912272135
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,1536,6144,0.0997048881318834
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,1536,51200,3.6694933573404946
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,1536,7168,0.5197831259833442
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,1536,8192,0.8133840031094022
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,1536,5120,0.08932089143329197
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,1536,6144,0.4439431031545003
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,1536,7168,0.7162737846374512
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,1536,5120,0.3733475473192003
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,1536,4096,0.05992533100975884
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,1536,6144,0.616104867723253
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,1536,3584,0.05744355254703098
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,1536,5120,0.5193004608154297
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,1536,3072,0.05122311247719658
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,1536,65536,4.704137590196398
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,1536,4096,0.30215289857652455
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,1536,2560,0.04624355501598782
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,1536,3584,0.2653191089630127
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,1536,4096,0.41983911726209855
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,1536,3584,0.3701484468248155
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,1536,3072,0.22858932283189562
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,1536,3072,0.3210595448811849
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,1536,2560,0.19218044810824922
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,1536,1536,0.027285334136750963
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,1536,2560,0.2699413299560547
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,1536,2048,0.1519048876232571
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,1536,2048,0.21528532769944933
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,1536,1024,0.019955555597941082
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,1536,51200,4.9291403028700085
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,1536,768,0.01604977746804555
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,1536,1536,0.11106489102045695
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,1536,1536,0.16262933943006727
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,1536,512,0.012332444389661154
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,1536,1024,0.07655733161502414
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,1536,768,0.09257955683602227
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,1536,768,0.05861155854331123
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,1536,512,0.043895999590555825
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,1536,512,0.07117155525419447
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,1536,128,0.009326222042242685
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,1536,256,0.046851555506388344
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,1536,256,0.030826667944590252
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,1536,64,0.009907555249002244
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,1536,128,0.024681778417693243
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,1536,128,0.034809778134028115
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,1536,32,0.008646222452322641
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,1536,64,0.022341334157519873
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,1536,32,0.02161688937081231
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,1536,2048,0.03387466735310025
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,1536,65536,6.314091576470269
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,1024,65536,0.697646247016059
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,1024,51200,0.5670266681247288
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,1536,1024,0.11629954973856609
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,1536,256,0.010384889112578498
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,1024,16384,0.2031973335478041
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,1024,12288,0.12418488661448161
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,1024,12288,0.86553865008884
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,1024,16384,1.121847152709961
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,1024,10240,0.1139448881149292
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,1024,12288,1.1487661997477214
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,1024,8192,0.09236266877916123
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,1024,16384,1.524502224392361
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,1024,10240,0.684507581922743
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,1024,7168,0.07766489187876384
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,1024,8192,0.5489724477132162
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,1024,10240,0.9633786943223742
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,1024,8192,0.7752933502197266
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,1024,6144,0.07108889023462932
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,1024,7168,0.483284420437283
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,1024,51200,3.3880507151285806
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,1024,7168,0.6815528869628906
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,1024,5120,0.05167644553714328
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,1024,6144,0.41597599453396267
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,1024,4096,0.04598844382497999
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,1024,6144,0.5886773533291286
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,1024,5120,0.34978045357598203
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,1024,3584,0.04190133346451653
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,1024,4096,0.28188443183898926
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,1024,65536,4.332488165961371
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,1024,3072,0.035114665826161705
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,1024,4096,0.4003671010335286
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,1024,3584,0.24879021114773223
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,1024,2560,0.029493331909179688
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,1024,3584,0.35254044002956814
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,1024,3072,0.21467999617258707
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,1024,2048,0.024446222517225478
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,1024,3072,0.30641155772738987
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,1024,2560,0.17903378274705675
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,1024,1536,0.01941866676012675
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,1024,2560,0.2570506731669108
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,1024,1024,0.01460622251033783
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,1024,2048,0.2038266658782959
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,1024,1536,0.10296355353461371
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,1024,1536,0.15400266647338867
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,1024,768,0.012134222520722283
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,1024,1024,0.07048355870776706
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,1024,1024,0.11007999711566502
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,1024,768,0.05361688799328274
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,1024,768,0.08647822009192573
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,1024,256,0.007268444531493717
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,1024,512,0.039701332648595176
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,1024,512,0.06477777825461493
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,1024,128,0.006778666542636023
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,1024,256,0.0273973329199685
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,1024,256,0.04458933406405979
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,1024,64,0.007214222517278459
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,1024,128,0.02163022259871165
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,1024,128,0.0325911111301846
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,1024,32,0.007290666302045186
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,1024,65536,6.0161866082085504
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,1024,64,0.019241778386963736
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,1024,32,0.018545778261290658
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,1024,2048,0.14114399751027426
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,1024,51200,4.706657833523221
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,768,65536,0.5451368755764431
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,768,51200,0.4046773380703396
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,1024,512,0.009025777379671732
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,768,16384,0.15632355213165283
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,1024,5120,0.49442222383287215
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,768,12288,0.11932978365156387
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,768,12288,0.7913297547234429
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,768,16384,1.0615510940551758
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,768,10240,0.08976178036795722
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,768,16384,1.4851680331759984
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,768,12288,1.1465253829956055
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,768,8192,0.07247910896937053
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,768,10240,0.6626035372416178
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,768,7168,0.061590221193101674
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,768,10240,0.9386559592352973
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,768,8192,0.5312453375922309
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,768,6144,0.055239998632007174
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,768,7168,0.46795468860202366
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,768,6144,0.40221601062350804
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,768,7168,0.664463996887207
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,768,5120,0.04529777831501431
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,768,51200,3.256588406032986
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,768,4096,0.039368887742360435
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,768,6144,0.5732293128967285
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,768,5120,0.33839111857944065
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,768,3584,0.031073778867721558
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,768,5120,0.48089599609375
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,768,4096,0.2733111116621229
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,768,3072,0.027637332677841187
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,768,65536,4.1660745408799915
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,768,4096,0.38983111911349827
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,768,3584,0.24067645602756074
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,768,2560,0.02436711059676276
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,768,8192,0.7555937767028809
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,768,2048,0.01997244523631202
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,768,3072,0.20762044853634307
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,768,3584,0.34316176838344997
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,768,1536,0.015950222810109455
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,768,2560,0.17357867293887666
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,768,3072,0.29782221052381724
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,768,2560,0.25108355946011013
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,768,2048,0.1364106602138943
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,768,1024,0.012426666915416718
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,768,2048,0.1977084477742513
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,768,1536,0.099708444542355
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,768,768,0.010064889159467485
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,768,512,0.00794666674402025
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,768,1536,0.14950666162702772
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,768,1024,0.06891910897360908
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,768,256,0.006590222318967183
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,768,768,0.08520266744825576
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,768,768,0.05300977826118469
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,768,512,0.06423644224802653
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,768,512,0.036561777194341026
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,768,128,0.0058746664888328975
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,768,256,0.025761778155962627
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,768,51200,4.589681837293837
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,768,256,0.04293244414859348
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,768,64,0.007948444121413762
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,768,128,0.019606222709019978
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,768,128,0.0314977765083313
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,768,64,0.01761777698993683
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,768,32,0.016944888565275405
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,512,65536,0.40017067061530215
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,512,51200,0.3018435637156169
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,768,65536,5.876338534884983
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,512,16384,0.10096266534593369
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,768,1024,0.10681866937213474
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,512,12288,0.07304710812038846
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,768,32,0.005218666460778978
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,512,16384,1.0104266272650826
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,512,12288,0.7602462238735623
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,512,10240,0.06084622277153862
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,512,12288,1.0910835266113281
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,512,16384,1.4481724633110895
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,512,8192,0.05276088913281759
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,512,10240,0.6356453365749782
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,512,7168,0.04202399982346428
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,512,10240,0.9155546824137369
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,512,8192,0.5117786725362142
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,512,6144,0.03659644391801622
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,512,8192,0.7354008886549207
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,512,7168,0.4491875436570909
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,512,5120,0.03087377879354689
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,512,6144,0.38710488213433164
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,512,7168,0.647708468967014
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,512,4096,0.02481777800454034
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,512,5120,0.3249439928266737
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,512,6144,0.5581946902804905
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,512,3584,0.022408000297016565
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,512,65536,4.010496775309245
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,512,4096,0.263267543580797
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,512,5120,0.46920087602403426
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,512,3072,0.01936444474591149
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,512,4096,0.3787279923756917
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,512,3584,0.23109067810906303
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,512,2560,0.01713511182202233
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,512,3584,0.3345199955834283
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,512,3072,0.1991751061545478
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,512,2048,0.014513777361975776
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,512,3072,0.29007289144727916
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,512,2560,0.1668684482574463
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,512,1536,0.01204622205760744
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,512,2560,0.24403643608093262
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,512,1024,0.008996444443861643
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,512,2048,0.13147555457221136
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,512,2048,0.19336533546447754
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,512,51200,3.138257768419054
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,512,1536,0.09502577781677246
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,512,1536,0.14571821689605713
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,512,768,0.007981333467695449
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,512,512,0.006637333167923822
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,512,1024,0.0654568870862325
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,512,1024,0.10317155387666489
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,512,256,0.0052800000541739995
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,512,51200,4.474029541015625
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,512,768,0.08272088898552789
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,512,768,0.04924799998601278
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,512,512,0.03529599971241421
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,512,128,0.004555555681387584
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,512,512,0.061358220047420926
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,512,256,0.04119911127620273
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,512,64,0.004517333375083076
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,512,32,0.004569777597983678
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,512,256,0.024018666810459558
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,512,128,0.01828266680240631
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,512,128,0.030184000730514526
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,512,64,0.016193777322769165
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,512,32,0.01549600064754486
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,256,65536,0.23404177029927573
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,256,16384,0.05753155549367269
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,256,51200,0.1804115507337782
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,256,12288,0.04422755704985725
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,512,65536,5.719514634874131
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,256,12288,0.7383102311028374
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,256,10240,0.03751555416319106
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,256,16384,1.0001519521077473
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,256,16384,1.4054560131496852
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,256,8192,0.03151466780238681
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,256,12288,1.0612026850382488
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,256,10240,0.6151750882466634
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,256,7168,0.027664000789324444
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,256,10240,0.8892737494574653
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,256,8192,0.49524354934692383
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,256,6144,0.02355466617478265
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,256,7168,0.43486666679382324
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,256,8192,0.7153849071926541
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,256,5120,0.016728000508414376
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,256,6144,0.3743280039893256
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,256,7168,0.6295315424601237
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,256,4096,0.014270222849316068
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,256,51200,3.0263902876112194
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,256,5120,0.314102225833469
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,256,5120,0.45543909072875977
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,256,3584,0.01276622215906779
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,256,4096,0.2544168896145291
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,256,4096,0.3685146702660455
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,256,3072,0.011681777735551199
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,256,3584,0.2238017717997233
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,256,65536,3.870904710557726
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,256,3584,0.3250844478607178
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,256,3072,0.19273066520690918
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,256,3072,0.2815919982062446
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,256,2560,0.16127288341522217
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,256,2048,0.008745777938101027
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,256,2560,0.23742845323350695
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,256,6144,0.5428009033203125
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,256,1536,0.007658667034573025
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,256,51200,4.351482815212674
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,256,2048,0.12601866987016466
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,256,1024,0.006292444550328785
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,256,1536,0.09105866485171848
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,256,1536,0.14107467068566218
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,256,768,0.005609777652555042
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,256,1024,0.06231377522150675
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,256,1024,0.09944088591469659
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,256,512,0.004912888838185204
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,256,768,0.04685777756902906
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,256,768,0.08005066712697347
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,256,256,0.004224888980388641
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,256,512,0.032983111010657415
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,256,512,0.058669335312313504
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,256,128,0.003663111064169142
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,256,256,0.039727999104393855
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,256,256,0.02234755622016059
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,256,64,0.0035128887328836652
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,256,32,0.003555555724435382
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,256,2560,0.01074577785200543
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,256,128,0.028817776176664565
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,256,128,0.016551110479566786
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,256,64,0.014488889111412896
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,256,32,0.014083556003040738
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,128,51200,0.13987555768754747
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,256,65536,5.563200208875869
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,128,65536,0.1803893380694919
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,128,16384,0.04622311062282986
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,128,12288,0.03570400012864007
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,256,2048,0.18669422467549643
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,128,12288,0.722483581966824
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,128,16384,0.9588052961561414
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,128,10240,0.03016977839999729
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,128,12288,1.057132403055827
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,128,8192,0.025655110677083332
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,128,16384,1.402726173400879
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,128,10240,0.60444090101454
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,128,7168,0.022611555125978258
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,128,10240,0.8864631123012967
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,128,8192,0.4867635303073459
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,128,6144,0.01576622161600325
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,128,8192,0.7133733431498209
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,128,6144,0.3675146632724338
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,128,5120,0.011861333416567909
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,128,7168,0.6274684270222982
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,128,51200,2.9623671637641062
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,128,4096,0.009917333722114563
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,128,6144,0.5414480103386773
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,128,5120,0.30863110224405926
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,128,3584,0.008991111483838823
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,128,5120,0.45455291536119247
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,128,4096,0.24897421730889213
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,128,3072,0.007994666695594788
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,128,4096,0.367977778116862
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,128,3584,0.21917243798573813
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,128,65536,3.794109344482422
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,128,7168,0.42714399761623806
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,128,3072,0.18844000498453775
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,128,3584,0.3240026632944743
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,128,2048,0.006632888896597757
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,128,3072,0.28073867162068683
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,128,2560,0.1578071117401123
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,128,1536,0.00591555568906996
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,128,2560,0.2371119923061795
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,128,2048,0.1230328877766927
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,128,2048,0.18569778071509468
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,128,1536,0.08864800135294597
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,128,1536,0.14048177666134304
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,128,768,0.004519999855094486
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,128,1024,0.06037155787150065
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,128,1024,0.09939466582404242
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,128,512,0.003903999924659729
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,128,51200,4.329842461480035
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,128,768,0.07829333013958402
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,128,768,0.04607022139761183
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,128,256,0.0035111109415690103
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,128,512,0.03212889035542806
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,128,512,0.05848977963129679
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,128,256,0.039080000585979886
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,128,256,0.021644444929228887
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,128,64,0.003176888864901331
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,128,32,0.0032257777121331957
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,128,128,0.01579466627703773
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,128,2560,0.007301333049933116
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,128,32,0.01313244468635983
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,64,65536,0.18060178226894805
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,128,65536,5.538949330647786
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,128,1024,0.0052284445199701525
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,64,51200,0.13345777988433838
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,64,16384,0.05141511228349474
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,64,12288,0.03650310966703627
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,128,128,0.0032355555643637977
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,64,10240,0.0292524430486891
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,128,64,0.013723555538389417
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,64,8192,0.024890666206677754
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,64,12288,0.7168266508314344
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,64,7168,0.02151288919978672
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,64,16384,0.9531119664510092
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,64,6144,0.014803555276658801
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,64,10240,0.5990239779154459
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,64,5120,0.010098666780524785
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,64,8192,0.4834773275587294
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,64,4096,0.008664000365469191
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,64,3584,0.007984889050324758
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,64,7168,0.4227724340226915
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,64,3072,0.007296000089910295
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,64,6144,0.3638870981004503
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,64,5120,0.3052204449971517
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,64,2560,0.007287110719415877
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,64,2048,0.006267555471923616
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,64,4096,0.2465448909335666
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,64,3584,0.21688532829284668
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,64,1536,0.00554577757914861
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,64,3072,0.18713066313001844
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,64,1024,0.004902222090297275
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,64,768,0.004233777936961916
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,64,2560,0.1558497746785482
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,64,2048,0.1225679980383979
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,64,512,0.0038604442444112566
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,64,1536,0.08751289049784343
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,64,256,0.0032239999208185407
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,64,1024,0.060327112674713135
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,64,128,0.003169777699642711
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,64,768,0.0445128877957662
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,64,64,0.003006222140457895
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,64,512,0.03163199954562717
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,64,32,0.0028853333658642242
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,64,256,0.020789333515697055
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,64,128,0.0151573336786694
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,64,64,0.013397333522637686
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,64,32,0.013088000317414602
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,32,65536,0.1710560056898329
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,32,51200,0.12668355305989584
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,32,16384,0.046748446093665234
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,32,12288,0.03630133469899496
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,32,10240,0.027727110518349543
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,64,51200,2.9458204905192056
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,32,8192,0.023648000425762598
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,32,12288,0.7160648769802518
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,32,10240,0.5991759830050999
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,64,65536,3.7686169942220054
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,32,7168,0.020742222666740417
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,32,6144,0.012306667036480375
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,32,16384,0.952723503112793
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,32,5120,0.009376000199053023
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,32,4096,0.007640000018808577
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,32,8192,0.4820995330810547
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,32,3584,0.007284444239404466
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,32,6144,0.36359379026624894
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,32,7168,0.42281333605448407
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,32,5120,0.30540622605217826
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,32,3072,0.006609777609507243
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,32,4096,0.24671732054816353
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,32,2560,0.005917333480384614
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,32,2048,0.005233777893914117
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,32,3584,0.21883022785186768
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,32,1536,0.005605333381228977
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,32,1024,0.004705777598751916
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,32,2560,0.15746133857303196
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,32,2048,0.12383466296725804
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,32,768,0.0042275554604000514
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,32,512,0.0038622220357259116
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,32,1024,0.06044444772932264
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,32,256,0.0032186667538351486
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,32,768,0.0451546675629086
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,32,128,0.003169777699642711
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,32,256,0.020984888076782227
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,32,64,0.002883555574549569
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,32,128,0.015189333094490899
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8192,32,32,0.0028817777832349143
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,32,64,0.013345777988433838
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,32,32,0.012811555630630918
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,32,51200,2.9406941731770835
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,32,3072,0.18845600552029082
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,32,1536,0.08860088719262017
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,32,512,0.03186933199564616
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8192,32,65536,3.7716454399956594
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,65536,10240,3.777006361219618
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,65536,12288,4.574415842692058
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,65536,12288,4.921947479248047
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,65536,16384,6.0132569207085504
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,65536,16384,7.222303602430556
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,65536,8192,3.0525332556830516
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,65536,7168,2.559768040974935
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,65536,8192,3.0859440697564016
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,65536,10240,3.8974168565538196
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,65536,7168,2.664783901638455
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,65536,5120,1.8548293643527562
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,65536,6144,2.1709103054470487
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,65536,6144,2.262645297580295
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,65536,4096,1.3824400371975367
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,65536,5120,1.8961128658718531
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,65536,3584,1.3066000408596463
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,65536,4096,1.464805285135905
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,65536,3584,1.3115306430392795
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,65536,3072,1.0291413201226127
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,65536,2560,0.8890462451510959
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,65536,3072,1.1235777537027996
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,65536,2560,0.9365012910630969
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,65536,1024,0.35737066798739964
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,65536,1536,0.5318035549587673
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,65536,1536,0.5980621973673502
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,65536,2048,0.7790391180250379
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,65536,768,0.28818223211500377
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,65536,512,0.20852000183529326
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,65536,1024,0.4900088840060764
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,65536,768,0.35241156154208714
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,65536,256,0.1520693302154541
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,65536,128,0.12079466713799371
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,65536,256,0.26993778016832143
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,65536,64,0.10328621996773614
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,65536,32,0.10934311151504517
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,65536,128,0.25585420926411945
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,65536,64,0.2577093442281087
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,65536,32,0.2592346668243408
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,65536,2048,0.7131191359625922
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,65536,512,0.33309245109558105
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8192,128,128,0.0284826656182607
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,65536,51200,18.67053731282552
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,51200,16384,4.28602557712131
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,51200,12288,3.291224797566732
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,51200,16384,5.448002709282769
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,51200,12288,3.8075599670410156
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,51200,10240,2.9311165279812283
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,51200,10240,3.1164311303032766
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,51200,8192,2.3031092749701605
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,51200,7168,1.9531591203477647
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,65536,51200,27.343865288628475
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,51200,8192,2.39920531378852
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,51200,6144,1.6155243979560003
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,51200,5120,1.404280874464247
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,51200,6144,1.8105227152506511
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,51200,51200,13.497911241319445
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,51200,7168,2.0748621622721353
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,51200,4096,1.0951822068956163
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,51200,3584,1.0153875350952148
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,51200,4096,1.184883541531033
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,51200,5120,1.4917173385620117
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,51200,3584,1.0519093407524955
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,51200,3072,0.9516773223876953
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,51200,2560,0.6340053346421983
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,51200,2048,0.6135039859347874
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,51200,2560,0.7430968814425998
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,51200,3072,0.8734230995178223
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,51200,1536,0.41671911875406903
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,51200,1024,0.2831351227230496
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,51200,768,0.23234134250217012
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,51200,1024,0.358063989215427
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,51200,2048,0.784647093878852
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,51200,1536,0.5867555406358507
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,51200,512,0.17384621832105848
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,51200,256,0.11710933844248454
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,51200,512,0.23795644442240396
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,51200,128,0.12296356095208062
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,51200,256,0.22124977906545004
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,51200,64,0.0816462238629659
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,51200,128,0.200673778851827
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,51200,32,0.08641066816118027
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,51200,32,0.2061920033560859
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,51200,64,0.21024978160858154
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,51200,65536,17.687203301323784
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,51200,768,0.3154746691385905
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,16384,16384,1.5770817862616644
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,16384,16384,2.0248436397976346
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,16384,12288,1.0266382429334853
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,16384,51200,4.356530507405599
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,16384,10240,0.9901644388834635
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,16384,12288,1.454072846306695
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,51200,51200,21.656324598524307
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,16384,8192,0.7978969150119357
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,16384,65536,5.55038579305013
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,16384,8192,0.946056048075358
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,16384,7168,0.6437830924987793
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,16384,10240,1.209082709418403
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,16384,6144,0.5871431032816569
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,16384,5120,0.5294391314188639
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,16384,6144,0.7015360196431478
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,16384,4096,0.41151822937859434
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,16384,7168,0.9464693069458008
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,16384,5120,0.583847098880344
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,16384,3584,0.2938275602128771
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,16384,3072,0.28058311674329967
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,16384,4096,0.5377813445197211
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,16384,2560,0.21667467223273384
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,16384,3072,0.3443902333577474
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,16384,3584,0.44374667273627383
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,16384,2048,0.17919554975297716
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,16384,2560,0.31096000141567653
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,16384,1536,0.13388710551791722
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,16384,1024,0.09699377748701309
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,16384,2048,0.23930578761630586
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,16384,768,0.08420799838172065
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,16384,1536,0.21216355429755318
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,16384,512,0.06063555346594917
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,16384,1024,0.14359022511376276
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,16384,256,0.03972533345222473
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,16384,128,0.03376177615589566
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,16384,512,0.09587377972073025
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,16384,64,0.029383109675513372
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,16384,256,0.08022310998704699
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,16384,32,0.029098666376537744
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,16384,128,0.07525066534678142
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,16384,64,0.07537333170572917
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,16384,32,0.07619644535912408
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,16384,51200,8.271339416503906
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,16384,768,0.11221244600084092
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,12288,16384,0.9560089111328125
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,12288,16384,1.6337608761257594
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,12288,12288,0.7856782277425131
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,12288,51200,3.2092925177680125
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,12288,10240,0.6379920111762153
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,16384,65536,12.331715053982206
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,12288,12288,1.1695742077297635
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,12288,8192,0.5453235308329264
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,12288,65536,4.275178697374132
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,12288,10240,0.9842533535427518
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,12288,7168,0.46378845638699
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,12288,6144,0.41802310943603516
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,12288,8192,0.7922124332851834
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,12288,5120,0.38832889662848574
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,12288,7168,0.697656896379259
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,12288,4096,0.2531786759694417
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,12288,6144,0.5720835791693794
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,12288,3584,0.24347734451293945
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,12288,3072,0.19741511344909668
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,12288,5120,0.571000893910726
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,12288,4096,0.4387093385060628
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,12288,2560,0.17097777790493437
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,12288,3584,0.3826871183183458
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,12288,3072,0.29046400388081867
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,12288,2048,0.13411822583940294
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,12288,1536,0.10398577981524998
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,12288,2560,0.252039114634196
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,12288,1024,0.07413422399097018
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,12288,768,0.05898133251402113
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,12288,2048,0.2269244458940294
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,12288,512,0.040707555082109236
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,12288,1536,0.1584497822655572
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,12288,1024,0.11746044953664143
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,12288,256,0.030662222041024104
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,12288,768,0.10149066978030735
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,12288,128,0.02695200012789832
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,12288,64,0.0247688889503479
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,12288,512,0.08064533604515924
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,12288,256,0.06553955872853597
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,12288,32,0.025584000680181716
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,12288,128,0.05997955799102783
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,12288,64,0.06066133578618368
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,12288,32,0.06188978089226616
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,12288,51200,6.424955579969619
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,10240,16384,0.9103458192613391
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,10240,12288,0.6201786465115017
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,10240,16384,1.440651575724284
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,12288,65536,9.27532704671224
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,10240,51200,2.7774071163601346
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,10240,10240,0.5825040075514052
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,10240,12288,1.047350247701009
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,10240,8192,0.4660373263888889
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,10240,65536,3.447015126546224
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,10240,7168,0.3986062208811442
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,51200,65536,35.27095201280382
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,10240,10240,0.8871155314975314
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,10240,8192,0.744110213385688
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,10240,5120,0.25933954450819224
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,10240,6144,0.3570248815748427
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,10240,4096,0.2102515565024482
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,10240,6144,0.5616284476386176
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,10240,7168,0.662775993347168
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,10240,3584,0.21988356113433838
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,10240,5120,0.427856895658705
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,10240,4096,0.35393688413831925
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,10240,3072,0.17239644792344835
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,10240,2560,0.15856088532341853
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,10240,2048,0.10928444729910956
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,10240,3584,0.2944977813296848
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,10240,3072,0.2575431134965685
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,10240,1536,0.0986951125992669
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,10240,2560,0.2118826707204183
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,10240,1024,0.060416890515221484
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,10240,2048,0.18205511569976807
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,10240,768,0.05487377776039971
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,10240,512,0.036269333627488874
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,10240,256,0.0351217786471049
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,10240,1536,0.13883645004696316
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,10240,1024,0.10339111089706421
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,10240,128,0.022755554980701868
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,10240,512,0.06852089034186469
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,10240,64,0.019201777047581144
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,10240,256,0.056530667675866016
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,10240,32,0.01928444372283088
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,10240,128,0.052074667480256825
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,10240,64,0.0524888899591234
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,10240,32,0.052786668141682945
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,10240,51200,5.7052001953125
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,10240,768,0.08218133449554443
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,8192,16384,0.7545982466803657
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,8192,12288,0.5926897790696886
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,8192,51200,2.195847193400065
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,8192,16384,1.238960901896159
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,10240,65536,7.896883646647136
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,8192,10240,0.479872014787462
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,8192,65536,2.9078648885091147
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,8192,12288,0.9022888607449002
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,8192,8192,0.35967289076911074
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,8192,7168,0.3310160107082791
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,8192,6144,0.2656444443596734
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,8192,10240,0.769504017300076
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,8192,8192,0.6144560178120931
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,8192,5120,0.228965335422092
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,8192,4096,0.18758666515350342
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,8192,6144,0.5645128885904948
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,8192,3584,0.16272621684604222
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,8192,5120,0.3900302251180013
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,8192,7168,0.567397329542372
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,8192,3072,0.15505333741505942
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,8192,4096,0.29775910907321507
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,8192,2560,0.12044800652398004
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,8192,3584,0.26669687694973415
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,8192,2048,0.09299288855658637
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,8192,1536,0.06810133324729072
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,8192,3072,0.25018488036261666
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,8192,1024,0.049046221706602305
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,8192,2560,0.1882044474283854
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,8192,768,0.03910488883654276
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,8192,2048,0.15338667233784994
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,8192,512,0.030563556485705908
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,8192,256,0.021457778082953557
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,8192,1024,0.0910080009036594
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,8192,128,0.0181048893266254
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,8192,768,0.08208711279763116
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,8192,64,0.01535288823975457
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,8192,512,0.06111466884613037
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,8192,32,0.015837333268589444
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,8192,256,0.047945777575174965
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,8192,128,0.043883555465274386
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,8192,64,0.04504088891877068
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,8192,32,0.04354666670163473
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,8192,51200,4.519125196668837
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,7168,16384,0.600728882683648
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,8192,1536,0.12132355901930068
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,7168,12288,0.4828791088528103
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,7168,16384,1.1576737297905815
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,7168,10240,0.4314017825656467
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,7168,51200,1.822058571709527
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,8192,65536,6.398313734266494
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,7168,12288,0.8316062291463217
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,7168,8192,0.358151117960612
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,7168,7168,0.26461866166856557
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,7168,65536,2.374737845526801
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,7168,10240,0.6948889096577963
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,7168,6144,0.2723955578274197
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,7168,5120,0.19849510987599692
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,7168,7168,0.4855288929409451
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,7168,8192,0.5852844450208876
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,7168,4096,0.1815377738740709
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,7168,3584,0.14529155360327825
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,7168,3072,0.12949689229329428
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,7168,6144,0.5101591216193305
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,7168,5120,0.3480568991767035
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,7168,3584,0.2422880066765679
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,7168,2560,0.10972622368070815
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,7168,4096,0.30337688657972545
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,7168,2048,0.0870257748497857
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,7168,1536,0.06945244471232097
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,7168,3072,0.20516622066497803
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,7168,2560,0.1839991145663791
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,7168,768,0.03511733478969998
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,7168,1536,0.11472177505493164
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,7168,512,0.025906667113304138
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,7168,256,0.01953866746690538
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,7168,1024,0.09667733642790054
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,7168,128,0.01953066719902886
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,7168,768,0.06755289104249743
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,7168,512,0.05573866764704386
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,7168,64,0.01442577772670322
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,7168,256,0.043861332866880626
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,7168,32,0.014771555860837301
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,7168,128,0.04168444540765551
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,7168,64,0.038564443588256836
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,7168,32,0.0367253323396047
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,7168,51200,4.196156395806207
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,7168,1024,0.04424444503254361
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,7168,2048,0.1434266699684991
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,6144,16384,0.5420586797926161
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,6144,12288,0.4824230935838487
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,6144,51200,1.8062790764702692
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,6144,16384,1.0449128680759006
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,7168,65536,5.74112531873915
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,6144,65536,2.208949406941732
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,6144,8192,0.2645671102735731
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,6144,10240,0.3755839930640326
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,6144,6144,0.20328088601430258
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,6144,7168,0.24140532811482748
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,6144,10240,0.6376258002387153
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,6144,12288,0.8098897933959961
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,6144,5120,0.1753822167714437
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,6144,8192,0.5743858019510905
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,6144,4096,0.13976532883114284
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,6144,7168,0.5384871164957682
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,6144,3584,0.12290310859680176
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,6144,6144,0.38553423351711696
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,6144,5120,0.32178934415181476
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,6144,3072,0.10290577676561143
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,6144,2560,0.0914720031950209
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,6144,2048,0.06881244315041436
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,6144,4096,0.3085270987616645
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,6144,3584,0.22121244006686738
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,6144,1536,0.05330577823850843
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,6144,1024,0.03729688790109422
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,6144,3072,0.1908257802327474
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,6144,2560,0.1600302192899916
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,6144,768,0.028584000137117174
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,6144,512,0.020964443683624268
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,6144,2048,0.13134666283925375
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,6144,1536,0.1178284486134847
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,6144,1024,0.07835911379920112
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,6144,768,0.06234044498867459
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,6144,128,0.015494222442309061
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,6144,64,0.01788444485929277
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,6144,256,0.0377511117193434
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,6144,32,0.018617777360810172
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,6144,128,0.03495644529660543
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,6144,64,0.03427555494838291
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,6144,32,0.03292444348335266
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,6144,51200,3.7537138197157116
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,5120,16384,0.44368799527486164
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,6144,256,0.01703288820054796
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,6144,512,0.049365331729253135
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,6144,65536,5.0721965365939665
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,5120,12288,0.3115431202782525
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,5120,51200,1.5426728990342882
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,5120,10240,0.31120178434583873
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,5120,65536,1.9156445397271051
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,5120,8192,0.26409244537353516
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,5120,16384,0.9972968631320529
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,5120,12288,0.7048124207390679
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,5120,10240,0.586942195892334
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,5120,6144,0.1736382246017456
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,5120,5120,0.13653243912590876
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,5120,6144,0.355545785692003
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,5120,8192,0.612609757317437
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,5120,4096,0.11700444751315647
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,5120,7168,0.5313039885626899
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,5120,5120,0.31674133406745064
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,5120,3584,0.10466400119993423
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,5120,3072,0.08152800136142306
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,5120,2560,0.07878755860858493
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,5120,4096,0.23262045118543836
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,5120,2048,0.05993688768810696
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,5120,3584,0.20750578244527182
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,5120,1536,0.044920000765058726
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,5120,1024,0.033258666594823204
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,5120,2560,0.14880977736579046
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,5120,768,0.02490844494766659
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,5120,2048,0.1195253398683336
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,5120,1536,0.0960364474190606
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,5120,512,0.018114666144053142
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,5120,256,0.01425333321094513
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,5120,1024,0.07466310924953885
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,5120,512,0.04443200098143684
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,5120,128,0.01277599980433782
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,5120,64,0.01069155583779017
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,5120,256,0.03404355711407132
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,5120,7168,0.21861510806613496
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,5120,32,0.010977778169843884
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,5120,128,0.030534221066368952
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,5120,64,0.03020533257060581
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,5120,51200,3.366545783148872
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,5120,32,0.029492444462246362
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,4096,16384,0.3737911118401422
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,5120,3072,0.1776968903011746
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,5120,65536,4.241552988688151
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,4096,12288,0.25747288597954643
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,5120,768,0.058008001910315625
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,4096,51200,1.1153092914157443
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,4096,10240,0.24423821767171225
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,4096,8192,0.19172355863783094
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,4096,16384,0.8782880041334363
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,4096,12288,0.626039981842041
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,4096,7168,0.16956444581349692
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,4096,10240,0.5254000027974447
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,4096,6144,0.1365777783923679
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,4096,5120,0.11417510774400498
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,4096,8192,0.5224426587422689
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,4096,7168,0.37578754954867893
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,4096,4096,0.09374488724602593
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,4096,6144,0.3506035539839003
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,4096,3584,0.07889866828918457
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,4096,5120,0.27047822210523814
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,4096,3072,0.07323733303281996
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,4096,4096,0.2123697731229994
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,4096,2560,0.06104355388217502
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,4096,3584,0.20076889461941191
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,4096,2048,0.04681333237224155
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,4096,3072,0.15635377830929226
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,4096,1536,0.0354639987150828
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,4096,2560,0.1301386621263292
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,4096,1024,0.025390222668647766
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,4096,768,0.02057422200838725
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,4096,65536,1.483501328362359
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,4096,1536,0.08547111352284749
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,4096,512,0.014601776997248331
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,4096,1024,0.06283555428187053
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,4096,256,0.011691555380821228
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,4096,768,0.052431109878751964
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,4096,128,0.011052444577217102
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,4096,512,0.038776887787712946
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,4096,64,0.010319111247857412
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,4096,256,0.029491557015313044
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,4096,32,0.010374222364690568
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,4096,128,0.027126222848892212
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,4096,51200,2.9167982737223306
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,4096,64,0.026114667455355327
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,4096,32,0.02574133376280467
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,3584,16384,0.28642222616407603
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,4096,65536,3.6301867167154946
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,4096,2048,0.1103279987970988
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,3584,12288,0.22988888952467176
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,3584,51200,0.9277839660644531
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,3584,10240,0.20515199502309164
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,3584,65536,1.2565111584133573
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,3584,8192,0.14748088518778482
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,3584,16384,0.8053466478983561
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,3584,7168,0.15590311421288386
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,3584,6144,0.11667822466956244
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,3584,12288,0.5957297748989528
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,3584,5120,0.091666665342119
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,3584,10240,0.552295102013482
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,3584,8192,0.44074222776624894
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,3584,7168,0.35504889488220215
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,3584,3584,0.06932977835337321
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,3584,6144,0.390430212020874
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,3584,5120,0.2555928760104709
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,3584,4096,0.20726933744218615
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,3584,2560,0.052896890375349254
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,3584,3584,0.17554222212897408
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,3584,2048,0.03911822372012668
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,3584,3072,0.15420533551110163
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,3584,2560,0.1254835526148478
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,3584,1024,0.0247688889503479
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,3584,2048,0.10190577639473809
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,3584,768,0.020578665865792167
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,3584,1536,0.08331466383404203
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,3584,512,0.016125332978036668
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,3584,1024,0.05894666910171509
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,3584,768,0.04732622371779548
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,3584,256,0.01201866649919086
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,3584,128,0.009645333720578088
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,3584,512,0.036320888333850436
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,3584,51200,2.653847164577908
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,3584,64,0.008626666333940294
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,3584,256,0.0276826669772466
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,3584,32,0.008957333034939235
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,3584,128,0.025361778007613286
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,3584,4096,0.07611822419696383
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,3584,32,0.024043555061022442
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,3584,3072,0.05979022052552965
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,3584,1536,0.0318853325313992
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,3584,65536,3.397959179348416
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,3072,16384,0.29831822713216144
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,3072,12288,0.20997599760691324
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,3072,51200,0.8326462109883627
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,3072,10240,0.17421244250403511
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,3072,65536,1.1831075880262587
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,3072,8192,0.1410613324907091
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,3072,12288,0.5755768881903754
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,3584,64,0.024950222836600408
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,3072,7168,0.11869777573479547
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,3072,6144,0.10109511348936294
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,3072,10240,0.5542382134331597
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,3072,5120,0.08972533543904622
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,3072,8192,0.4561946656968858
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,3072,4096,0.06682755549748738
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,3072,7168,0.33698132303025985
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,3072,6144,0.32567021581861705
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,3072,3072,0.05601244502597385
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,3072,5120,0.2501208782196045
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,3072,4096,0.20897421571943495
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,3072,2560,0.04529066549407112
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,3072,3584,0.16573422484927708
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,3072,2048,0.03517599900563558
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,3072,1536,0.028057777219348486
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,3072,3072,0.150036440955268
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,3072,2560,0.11905777454376221
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,3072,2048,0.09661689069535996
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,3072,1024,0.020111999577946134
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,3072,768,0.016195555528004963
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,3072,1536,0.07436711258358426
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,3072,512,0.012150222228633033
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,3072,1024,0.05531555414199829
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,3072,768,0.043803556097878345
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,3072,256,0.009705777797434065
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,3072,16384,0.7514630953470866
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,3072,51200,2.487412346733941
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,3072,512,0.03391199972894456
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,3072,128,0.009142222503821055
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,3072,32,0.008628444539176093
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,3072,64,0.00835111074977451
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,3072,256,0.02580533259444767
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,3072,128,0.02330577704641554
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,3072,64,0.022668444448047217
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,3072,32,0.02235466738541921
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,3072,3584,0.06296355856789483
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,3072,65536,3.1505218082004123
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,2560,16384,0.227164453930325
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,2560,12288,0.17843022611406115
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,2560,51200,0.6994560029771594
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,2560,10240,0.1760186619228787
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,2560,65536,1.001524395412869
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,2560,8192,0.12922222084469265
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,2560,12288,0.5361048910352919
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,2560,16384,0.706776883867052
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,2560,7168,0.1338746680153741
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,2560,6144,0.09491644303003947
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,2560,5120,0.09744799799389309
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,2560,10240,0.4888426462809245
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,2560,8192,0.3617271052466498
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,2560,4096,0.07890666855706109
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,2560,6144,0.2736568980746799
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,2560,7168,0.34259290165371364
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,2560,3584,0.0586986674202813
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,2560,5120,0.2286773257785373
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,2560,3072,0.04917422268125746
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,2560,2560,0.0417191121313307
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,2560,2048,0.03534311056137085
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,2560,4096,0.18544888496398926
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,2560,1536,0.027279999521043565
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,2560,3584,0.18852444489796957
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,2560,3072,0.1360702249738905
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,2560,1024,0.02012800011369917
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,2560,2560,0.11146222220526801
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,2560,768,0.014354666074117025
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,2560,512,0.011439111497667102
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,2560,2048,0.09114755524529351
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,2560,1536,0.07170044713550143
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,2560,1024,0.052829331821865506
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,2560,128,0.008407110969225565
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,2560,768,0.0411484440167745
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,2560,512,0.0314977765083313
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,2560,64,0.007316444483068254
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,2560,256,0.024346666203604803
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,2560,32,0.007262222468852997
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,2560,128,0.021662222014533147
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,2560,64,0.020954666866196528
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,2560,32,0.020599999361568026
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,2560,51200,2.290365431043837
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,2048,16384,0.1731519964006212
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,2048,12288,0.13430578178829616
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,2048,51200,0.5452639791700575
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,2048,65536,0.6580266422695583
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,2048,10240,0.12063022454579671
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,2560,65536,2.9176239437527127
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,2048,8192,0.10136977831522624
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,2048,16384,0.6668195724487305
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,2560,256,0.009014222357008193
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,2048,7168,0.08265688684251574
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,2048,12288,0.5213511255052354
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,2048,6144,0.06704088714387682
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,2048,10240,0.4600542386372884
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,2048,5120,0.0559519992934333
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,2048,8192,0.3394346767001682
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,2048,3584,0.03910488883654276
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,2048,7168,0.2995262145996094
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,2048,3072,0.035840001371171736
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,2048,5120,0.21535555521647134
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,2048,2560,0.03033866816096836
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,2048,3584,0.1469377809100681
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,2048,2048,0.025447110335032146
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,2048,2560,0.10485600100623237
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,2048,1536,0.019527999891175162
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,2048,2048,0.08469066354963516
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,2048,1024,0.01477777792347802
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,2048,1536,0.06505955590142144
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,2048,768,0.012019555601808759
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,2048,1024,0.04559822214974297
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,2048,51200,2.099435594346788
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,2048,512,0.009577777650621202
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,2048,256,0.007304888632562425
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,2048,768,0.038338667816585965
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,2048,512,0.029494222667482164
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,2048,128,0.006979555719428592
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,2048,256,0.022268444299697876
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,2048,4096,0.044793777995639376
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,2048,64,0.00628266649113761
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,2048,32,0.006632888896597757
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,2048,128,0.020003555549515616
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,2048,6144,0.2894328965081109
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,2048,65536,2.6942168341742625
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,2048,4096,0.1719199948840671
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,2048,32,0.01900888813866509
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,2048,3072,0.12434044149186875
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,1536,51200,0.3960551155938043
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,1536,65536,0.5562799771626791
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,1536,12288,0.10382311211691962
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,1536,10240,0.0977591143714057
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,1536,16384,0.6277750862969292
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,1536,8192,0.07377955648634169
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,1536,12288,0.5036693149142796
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,2048,64,0.018931556079122756
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,1536,7168,0.061292443010542125
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,1536,10240,0.410317341486613
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,1536,6144,0.05275200141800774
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,1536,5120,0.043493333790037364
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,1536,4096,0.034803556071387395
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,1536,8192,0.32115644878811306
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,1536,16384,0.13623378011915419
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,1536,3584,0.030273778571022883
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,1536,7168,0.2869493431515164
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,1536,3072,0.027943111128277246
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,1536,5120,0.2041768895255195
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,1536,4096,0.16274933020273843
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,1536,2048,0.020070221689012315
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,1536,3584,0.1397493282953898
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,1536,3072,0.11924178070492214
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,1536,1536,0.015248000621795654
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,1536,2560,0.09802666637632583
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,1536,2048,0.08080444733301799
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,1536,51200,1.9660453796386719
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,1536,768,0.009753777749008602
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,1536,1024,0.0432275566789839
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,1536,768,0.03508088986078898
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,1536,256,0.006350222147173352
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,1536,512,0.027461333407296076
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,1536,128,0.005940444353553984
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,1536,65536,2.5087413787841797
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,1536,64,0.005558222118351195
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,1536,128,0.0181377778450648
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,1536,32,0.005947555518812603
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,1536,64,0.017352888981501263
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,1536,6144,0.24380177921719023
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,1536,32,0.017160000072585214
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,1536,2560,0.022668444448047217
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,1536,1024,0.011648000114493899
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,1024,65536,0.36400800281100804
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,1024,51200,0.28624354468451607
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,1024,16384,0.090810669793023
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,1024,12288,0.07325155867470635
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,1536,512,0.007670222057236566
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,1024,10240,0.06040710873074002
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,1024,8192,0.04730311036109924
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,1536,256,0.020596444606781006
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,1024,12288,0.44318400488959414
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,1024,10240,0.37177689870198566
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,1024,16384,0.6202106475830078
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,1024,7168,0.041486223538716636
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,1024,8192,0.31328709920247394
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,1024,6144,0.035904887649748064
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,1024,5120,0.030241777499516804
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,1024,4096,0.02496533261405097
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,1024,3584,0.022008889251285132
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,1024,7168,0.2645911110772027
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,1024,6144,0.23114400439792207
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,1024,5120,0.19215199682447645
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,1024,4096,0.15077866448296443
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,1024,3072,0.019704000817404855
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,1024,2560,0.01772444446881612
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,1024,2048,0.014496889379289416
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,1024,3584,0.13048444853888616
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,1024,1536,0.011908444265524546
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,1024,1024,0.009367999931176504
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,1024,3072,0.11007644732793172
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,1024,2560,0.0916595525211758
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,1024,2048,0.07495733102162679
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,1024,768,0.008205333517657386
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,1024,512,0.0069253332912921906
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,1024,1536,0.058189332485198975
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,1024,256,0.005607999861240387
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,1024,1024,0.03958755400445726
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,1024,128,0.004936888813972473
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,1024,768,0.03253600001335144
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,1024,64,0.0046746668716271715
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,1024,512,0.025647999511824712
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,1024,32,0.004924444274769889
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,1024,51200,1.816525353325738
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,1024,256,0.018894222047593858
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,1024,128,0.016488000750541687
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,1024,64,0.015797333584891427
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,1024,32,0.01517777807182736
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,768,16384,0.08026844263076782
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,768,51200,0.2428373230828179
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,768,65536,0.2942613230811225
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,768,12288,0.06012533108393351
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,768,10240,0.04820355441835192
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,1024,65536,2.3182347615559897
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,768,8192,0.038873778449164495
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,768,10240,0.3585964573754205
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,768,16384,0.5662497944302028
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,768,12288,0.464004463619656
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,768,7168,0.037047111325793795
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,768,6144,0.029512001408471003
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,768,8192,0.29025689760843915
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,768,5120,0.026239999466472205
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,1536,1536,0.06394400199254353
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,768,4096,0.02201955517133077
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,768,3584,0.01830222209294637
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,768,7168,0.25508801142374676
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,768,6144,0.21961155202653673
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,768,3072,0.015799111790127225
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,768,5120,0.18418310748206246
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,768,2560,0.013822221921549903
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,768,2048,0.011640888949235281
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,768,4096,0.14524443944295248
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,768,3584,0.1273662249247233
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,768,1536,0.009687999884287516
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,768,1024,0.00797333319981893
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,768,3072,0.10550844669342041
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,768,2560,0.08787377675374348
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,768,768,0.006591111007663939
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,768,2048,0.07174844212002225
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,768,512,0.005888000130653381
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,768,1536,0.05575199921925863
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,768,256,0.004880889008442561
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,768,1024,0.03806666533152262
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,768,128,0.00423200014564726
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,768,64,0.0038382220599386427
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,768,768,0.03121688961982727
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,768,512,0.024336000283559162
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,768,32,0.004187555362780889
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,768,256,0.018201778332392376
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,768,51200,1.745664914449056
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,768,128,0.015489778584904142
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,768,64,0.014818666709793938
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,768,32,0.014442667365074158
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,512,16384,0.05735377470652262
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,512,65536,0.22124177879757354
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,512,51200,0.16451556152767605
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,512,12288,0.04410755634307861
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,512,10240,0.033878223763571844
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,512,8192,0.02711733347839779
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,768,65536,2.2331875695122614
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,512,7168,0.022051556242836848
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,512,10240,0.34547111723158097
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,512,12288,0.43117332458496094
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,512,8192,0.2796577877468533
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,512,16384,0.5455982420179579
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,512,5120,0.017158221867349412
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,512,4096,0.013879111243618859
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,512,7168,0.2460177739461263
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,512,3584,0.012465777496496836
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,512,6144,0.21539644400278726
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,512,5120,0.17722045050726998
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,512,4096,0.14076266023847792
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,512,2560,0.010281778044170803
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,512,2048,0.008587555752860175
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,512,3584,0.120706664191352
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,512,1536,0.007285333342022366
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,512,3072,0.10134044620725845
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,512,2560,0.08502133025063409
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,512,1024,0.006239111224810283
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,512,2048,0.06832800308863322
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,512,768,0.005502222312821283
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,512,1536,0.05156177613470289
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,512,512,0.004584889031118817
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,512,256,0.004197333421972063
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,512,1024,0.036008887820773654
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,512,768,0.02980177932315403
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,512,128,0.0038373333712418876
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,512,512,0.023341332872708637
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,512,64,0.003564444267087512
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,512,256,0.01754133403301239
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,512,51200,1.6794622209337022
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,512,128,0.014515555567211576
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,512,64,0.014116444521480136
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,512,32,0.013768889009952545
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,256,65536,0.16982844140794542
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,512,6144,0.018979556030697294
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,256,51200,0.13239999612172446
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,256,16384,0.044491555955674916
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,256,12288,0.035114665826161705
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,512,65536,2.1498845418294272
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,256,10240,0.029912889003753662
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,256,8192,0.021143111917707656
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,512,3072,0.011741333537631564
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,256,7168,0.015062222878138224
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,256,12288,0.3969928953382704
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,256,10240,0.33333423402574325
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,256,8192,0.26902132564120823
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,256,5120,0.011037333144081963
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,256,7168,0.23664977815416124
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,256,4096,0.010101333260536194
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,256,6144,0.2040248844358656
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,512,32,0.0038533334930737815
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,256,5120,0.17071733209821913
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,256,3584,0.009024000002278222
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,256,3072,0.008452444440788692
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,256,4096,0.1353706651263767
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,256,2560,0.007314666277832455
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,256,3584,0.11569244331783718
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,256,3072,0.09697510798772176
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,256,2048,0.006579555571079254
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,256,1536,0.005888888819350137
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,256,2560,0.08023733562893338
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,256,1024,0.004936000125275718
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,256,2048,0.06602133644951715
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,256,51200,1.6157555050320094
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,256,1536,0.04944711261325412
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,256,768,0.004243555582231945
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,256,512,0.0038933331767717996
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,256,256,0.003571555432346132
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,256,768,0.028549333413441975
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,256,128,0.003216888962520493
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,256,16384,0.5262835290696886
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,256,256,0.01625155574745602
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,256,65536,2.0621414184570312
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,256,64,0.0031315556002987754
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,256,32,0.0032391111469931076
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,256,128,0.013800000150998434
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,256,64,0.01314133322901196
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,256,32,0.01273333364062839
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,128,51200,0.07845511039098103
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,128,16384,0.03131999903255039
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,128,16384,0.514977773030599
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,256,1024,0.03425511055522495
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,128,12288,0.027793778313530818
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,128,10240,0.016300444801648457
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,256,6144,0.013092444174819522
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,128,8192,0.013456000222100152
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,128,7168,0.012379555238617791
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,128,12288,0.3892524507310655
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,128,10240,0.32663199636671275
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,128,6144,0.010967999696731567
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,128,8192,0.26405511962042916
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,128,65536,0.09684533543056911
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,128,7168,0.23186845249599883
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,128,4096,0.007967111137178209
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,128,3584,0.007559110720952352
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,128,51200,1.5808568530612523
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,128,6144,0.19988977909088135
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,128,5120,0.16738311449686685
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,128,3072,0.006945778098371293
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,128,2560,0.005936000082227919
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,128,4096,0.132149338722229
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,128,3584,0.11355288823445638
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,128,1536,0.004913777940803104
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,128,3072,0.09490311145782471
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,128,2560,0.07870311207241483
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,128,1024,0.00423911131090588
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,128,65536,2.023432837592231
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,128,2048,0.06400977902942233
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,128,512,0.0034942221310403612
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,128,1536,0.04777600036727058
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,128,256,0.0033288889875014624
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,128,1024,0.03295911020702786
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,256,512,0.022459555003378127
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,128,128,0.0032053333189752367
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,128,768,0.02801688843303257
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,128,512,0.021951999929216173
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,128,32,0.003212444484233856
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,128,256,0.015819556183285184
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,128,128,0.01312622262371911
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,128,64,0.012502222425407834
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,64,65536,0.09162488910886978
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,128,32,0.012392889294359418
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,64,51200,0.07589866717656453
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,64,16384,0.030933333767784968
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,128,5120,0.00943022221326828
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,64,12288,0.02438933319515652
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,64,10240,0.015486222174432544
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,128,2048,0.005591111050711737
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,64,12288,0.3885484536488851
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,64,16384,0.5157217979431152
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,64,8192,0.014102222190962898
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,64,10240,0.3258204460144043
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,64,7168,0.012476444244384766
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,64,6144,0.01107022249036365
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,128,768,0.003907555507289039
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,64,5120,0.009409777820110321
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,64,4096,0.008557333714432186
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,64,7168,0.23192445437113443
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,64,8192,0.2633484469519721
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,128,64,0.0031635556370019913
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,64,6144,0.19997689459058973
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,64,3584,0.007983999947706858
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,64,3072,0.00702311098575592
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,64,2560,0.0062977779242727495
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,64,4096,0.1319217814339532
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,64,2048,0.005601777798599667
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,64,1536,0.005250666704442766
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,64,3584,0.11321332719590928
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,64,3072,0.09434844387902154
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,64,2560,0.07810488674375746
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,64,2048,0.06390133168962267
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,64,1024,0.004520888957712385
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,64,768,0.003993777765168084
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,64,512,0.0034924443397257063
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,64,1536,0.047854221529430814
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,64,256,0.0032275555034478507
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,64,1024,0.032935112714767456
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,64,128,0.0028391112056043413
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,64,768,0.027752000424597
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,64,512,0.02159022291501363
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,64,51200,1.580529742770725
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,64,64,0.002809777855873108
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,64,32,0.002814222127199173
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,64,256,0.01550044450494978
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,64,128,0.013083555632167392
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,64,64,0.012123555772834353
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,32,65536,0.0905253357357449
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,32,51200,0.07373511128955416
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,32,16384,0.028055111567179363
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,64,65536,2.0214292738172746
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,32,12288,0.020592888196309406
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,32,10240,0.012625777886973487
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,64,5120,0.16679022047254774
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,32,8192,0.011149333582984077
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,32,12288,0.3887600104014079
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,32,10240,0.32611555523342556
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,32,16384,0.5156222449408637
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,32,7168,0.011040888726711273
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,32,6144,0.01035288886891471
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,32,5120,0.009552888572216034
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,32,8192,0.2634435494740804
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,32,7168,0.23162844445970324
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,32,6144,0.19954221778445771
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,32,3584,0.00796888851457172
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,32,5120,0.16733511288960776
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,32,3072,0.008616000413894653
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,64,32,0.012090666426552666
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,32,4096,0.13180532720353869
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,32,3584,0.11436800161997478
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,32,3072,0.09532711240980361
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,32,2560,0.07882133457395765
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,32,1536,0.004892444445027245
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,32,51200,1.579885376824273
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,32,1024,0.0039057777159743835
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,32,768,0.003548444559176763
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,32,1536,0.04759733213318718
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,32,1024,0.03295466634962294
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,32,512,0.0035342222286595237
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,32,768,0.02776977750990126
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,32,256,0.003162666741344664
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,32,65536,2.019918229844835
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,32,512,0.021588444709777832
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,32,256,0.015459555718633862
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,32,64,0.0028231110837724474
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,32,32,0.002797333316670524
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,32,128,0.01311555587583118
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,32,64,0.012224888636006249
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,32,4096,0.008303110798199972
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,32,32,0.012028444144460889
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,32,2560,0.007261333366235097
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,32,2048,0.0052266667286554975
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4353,32,2048,0.0640631119410197
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4353,32,128,0.0028320000403457214
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,65536,12288,3.9787173800998263
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,65536,16384,5.363337622748481
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,65536,12288,4.6866230434841585
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,65536,16384,6.666714562310113
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,65536,16384,6.290492587619358
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,65536,10240,3.5921724107530384
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,65536,10240,3.8530684577094187
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,65536,12288,4.450460645887587
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,65536,8192,2.800789303249783
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,65536,10240,3.7097981770833335
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,65536,8192,3.047807057698568
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,65536,7168,2.5366639031304254
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,65536,8192,2.8861378563774953
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,65536,7168,2.5750204722086587
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,65536,6144,2.162236531575521
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,65536,7168,2.615072038438585
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,65536,6144,2.159595489501953
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,65536,5120,1.8397725423177083
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,65536,6144,2.2236781650119357
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,65536,51200,16.73132832845052
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,65536,5120,1.9032062954372828
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,65536,4096,1.4343342251247828
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,65536,5120,1.8728968302408855
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,65536,4096,1.4701093037923176
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,65536,3584,1.1828301747639973
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,65536,3584,1.3146933449639213
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,65536,4096,1.4632559882269964
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,65536,3072,1.1150346332126193
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,65536,3584,1.3067760467529297
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,65536,3072,1.0815138287014432
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,65536,2560,0.8601199785868326
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,65536,2048,0.7781279881795248
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,65536,2048,0.7488728629218208
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,65536,2560,0.9444079928927951
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,65536,3072,1.0763013627794054
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,65536,1024,0.36847199334038633
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,65536,2560,0.9408906300862631
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,65536,1536,0.6306986808776855
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,65536,2048,0.7773768636915418
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,65536,1536,0.593290646870931
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,65536,1536,0.571922673119439
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,65536,768,0.32226400905185276
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,65536,1024,0.5654737684461806
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,65536,768,0.3490791055891249
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,65536,1024,0.44681866963704425
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,65536,512,0.22835556666056314
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,65536,768,0.358334223429362
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,65536,256,0.1598177750905355
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,65536,512,0.28102487987942165
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,65536,512,0.3545360035366482
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,65536,256,0.32887999216715497
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,65536,256,0.22233332528008354
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,65536,64,0.11484711700015598
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,65536,128,0.16931022538079155
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,65536,128,0.24790755907694498
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,65536,32,0.10280266735288833
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,65536,64,0.25443021456400555
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,65536,32,0.2586737738715278
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,65536,128,0.11911822689904107
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,65536,51200,20.057349310980904
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,65536,51200,28.254199557834202
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,51200,16384,4.103271908230252
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,51200,16384,5.419071197509766
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,51200,51200,12.88114759657118
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,51200,16384,4.934305826822917
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,51200,12288,3.1890133751763234
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,51200,65536,16.624957614474827
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,51200,12288,3.7670762803819446
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,51200,10240,2.7669012281629772
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,51200,12288,3.582821316189236
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,51200,10240,3.09295294019911
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,51200,10240,2.9803769853379993
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,51200,8192,2.1862960391574435
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,51200,51200,16.71013726128472
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,51200,8192,2.427433861626519
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,51200,51200,21.94815233018663
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,51200,7168,1.9816025627983942
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,51200,8192,2.39573245578342
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,51200,7168,2.1056285434299045
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,51200,6144,1.6336960262722438
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,51200,5120,1.3562755584716797
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,51200,6144,1.8436942630343969
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,51200,7168,2.0222256978352866
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,51200,5120,1.486703978644477
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,51200,6144,1.8331546783447266
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,51200,4096,1.03712887234158
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,51200,5120,1.449196391635471
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,51200,4096,1.1520399517483182
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,51200,3584,0.8843217955695258
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,51200,4096,1.1787652969360352
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,51200,3072,0.7967262268066406
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,51200,65536,21.591949462890625
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,51200,3584,1.0332746505737305
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,51200,3072,0.8629315694173177
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,51200,2560,0.6633377605014378
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,51200,3584,1.0164035161336262
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,51200,2048,0.5370800230238173
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,51200,3072,0.8869235780504016
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,51200,2048,0.5996746487087673
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,51200,1536,0.4302862220340305
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,51200,2560,0.7958889007568359
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,51200,1024,0.2689564492967394
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,51200,1536,0.5846471256679958
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,51200,2560,0.7398968802558051
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,51200,2048,0.63628265592787
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,51200,1536,0.5011990865071615
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,51200,768,0.2111795610851712
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,51200,1024,0.35350932015313047
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,51200,1024,0.5179928673638238
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,51200,512,0.16300088829464382
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,51200,256,0.11354933844672309
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,51200,768,0.2950177722507053
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,51200,65536,29.209238688151043
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,51200,768,0.2968222300211589
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,51200,512,0.27525332238939076
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,51200,128,0.09274578094482422
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,51200,256,0.19200710455576578
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,51200,64,0.07923644118838839
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,51200,32,0.07963644133673774
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,51200,256,0.24364354875352648
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,51200,128,0.1449484427769979
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,51200,512,0.239848878648546
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,51200,128,0.19773599836561415
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,51200,64,0.2130568954679701
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,51200,32,0.20596444606781006
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,16384,16384,1.3855884340074327
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,16384,16384,2.0438018374972873
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,16384,12288,1.0051395628187392
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,16384,16384,2.065399169921875
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,16384,51200,4.281469133165148
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,16384,12288,1.4456124835544164
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,16384,10240,0.9882435268825955
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,16384,65536,5.47727288140191
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,16384,12288,1.4900675879584417
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,16384,8192,0.8551715744866265
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,16384,10240,1.1902124616834853
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,16384,7168,0.6270764668782552
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,16384,8192,0.9521652857462565
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,16384,10240,1.201459566752116
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,16384,8192,0.9641528659396701
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,16384,51200,6.605222913953994
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,16384,7168,0.8339777522616916
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,16384,6144,0.5160711076524522
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,16384,7168,1.1594390869140625
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,16384,51200,8.551172044542101
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,16384,5120,0.4581751293606228
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,16384,6144,0.7474213176303439
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,16384,5120,0.5840097533331977
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,16384,4096,0.348831123775906
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,16384,6144,0.7224257787068685
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,16384,5120,0.6625279850429958
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,16384,3584,0.29200532701280385
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,16384,4096,0.45503997802734375
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,16384,4096,0.4891733593410916
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,16384,3584,0.41081423229641384
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,16384,3072,0.2415235572391086
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,16384,2560,0.21880622704823813
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,16384,3072,0.34069511625501847
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,16384,3584,0.43497599495781797
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,16384,2048,0.16608533594343397
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,16384,2560,0.296799103418986
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,16384,3072,0.3715777662065294
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,16384,65536,10.195084465874567
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,16384,2560,0.33930132124159074
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,16384,65536,8.535080803765192
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,16384,2048,0.23712976773579916
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,16384,1024,0.09125066465801662
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,16384,2048,0.26145156224568683
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,16384,768,0.08127644326951769
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,16384,1536,0.18713333871629503
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,16384,512,0.0570017761654324
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,16384,768,0.12407910823822021
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,16384,1024,0.19382754961649576
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,16384,256,0.04040888945261637
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,16384,512,0.10378044181399876
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,16384,512,0.09215911229451497
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,16384,128,0.03237777617242601
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,16384,256,0.08132177591323853
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,16384,256,0.08246666855282254
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,16384,64,0.02882222334543864
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,16384,128,0.07340800099902682
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,16384,128,0.06209777461157905
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,16384,32,0.029845333761639063
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,16384,64,0.07566222217347887
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,16384,32,0.07597600089179145
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,16384,1536,0.1299804449081421
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,16384,1536,0.20801688565148246
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,16384,1024,0.14194133546617296
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,12288,16384,1.0936604605780709
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,16384,768,0.12957244449191624
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,12288,51200,3.1979315016004772
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,12288,16384,1.6328230963812933
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,12288,16384,1.7069786919487848
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,12288,12288,0.8535982237921821
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,12288,65536,4.369185977511935
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,12288,12288,1.1671866310967338
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,12288,10240,0.6689955393473307
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,12288,10240,0.9779609044392904
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,12288,8192,0.620355553097195
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,12288,12288,1.2432230843438041
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,12288,8192,0.7552080154418945
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,12288,7168,0.4740497801038954
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,12288,10240,1.0032417509290907
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,12288,6144,0.3897253407372369
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,12288,51200,6.597085316975911
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,12288,8192,0.8918115827772352
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,12288,7168,0.6601395606994629
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,12288,51200,5.386003706190322
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,12288,5120,0.3389591111077203
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,12288,7168,0.8735226525200738
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,12288,6144,0.6328648991054958
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,12288,5120,0.4733324580722385
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,12288,4096,0.30042576789855957
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,12288,3584,0.22507733768886992
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,12288,6144,0.6358302434285482
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,12288,4096,0.37949421670701766
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,12288,5120,0.5373653305901421
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,12288,4096,0.42905865775214297
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,12288,3072,0.20474489529927573
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,12288,65536,8.132369147406683
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,12288,3584,0.4505910873413086
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,12288,2560,0.1724604500664605
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,12288,3072,0.2798159917195638
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,12288,3584,0.37795199288262266
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,12288,2048,0.14121245013342962
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,12288,3072,0.32770223087734646
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,12288,2560,0.24698400497436523
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,12288,65536,6.996264987521702
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,12288,1536,0.10730489095052083
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,12288,2560,0.29096444447835285
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,12288,2048,0.1951893303129408
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,12288,1024,0.07294311126073201
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,12288,768,0.05731022357940674
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,12288,2048,0.22337423430548775
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,12288,1536,0.18215110566880968
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,12288,512,0.04126311010784573
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,12288,1536,0.1783155600229899
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,12288,1024,0.13633155822753906
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,12288,256,0.03161333335770501
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,12288,768,0.11230044894748265
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,12288,768,0.09324800305896336
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,12288,1024,0.12338756190405951
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,12288,512,0.07526933484607272
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,12288,512,0.09654844469494289
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,12288,128,0.026347556047969397
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,12288,256,0.0681413345866733
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,12288,256,0.06375466452704535
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,12288,32,0.023748444186316595
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,12288,64,0.022680888573328655
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,12288,128,0.05505688985188802
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,12288,128,0.059340443876054555
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,12288,64,0.06123555368847317
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,12288,32,0.06005689170625475
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,10240,16384,0.9137261708577474
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,10240,51200,2.7776764763726125
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,10240,16384,1.4262195163302953
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,10240,65536,3.378851572672526
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,10240,12288,0.6364089118109809
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,10240,12288,1.0203271441989474
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,10240,10240,0.5949715508355035
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,10240,16384,1.501952913072374
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,10240,8192,0.46188444561428493
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,10240,12288,1.1101244820488823
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,10240,10240,0.8487520217895508
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,10240,7168,0.3888293372260199
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,10240,51200,5.578447129991319
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,10240,8192,0.8145119878980848
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,10240,10240,1.0105760362413194
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,10240,8192,0.7403564453125
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,10240,51200,4.849031236436632
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,10240,6144,0.32810044288635254
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,10240,7168,0.6378515561421713
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,10240,5120,0.28294844097561306
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,10240,6144,0.5110595491197374
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,10240,7168,0.6732248730129666
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,10240,4096,0.2190284464094374
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,10240,5120,0.4434719880421956
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,10240,6144,0.5633378028869629
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,10240,4096,0.3367679913838704
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,10240,3584,0.20831288231743705
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,10240,3072,0.16067643960316977
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,10240,3584,0.3001822100745307
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,10240,4096,0.3842257658640544
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,10240,3584,0.33641333050198025
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,10240,2560,0.13319910897148982
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,10240,3072,0.30396800571017796
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,10240,65536,7.421837700737847
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,10240,2048,0.10716444253921509
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,10240,3072,0.29036090109083385
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,10240,65536,6.365506490071614
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,10240,1536,0.08523022466235691
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,10240,2560,0.24620445569356283
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,10240,1024,0.06396889024310641
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,10240,2048,0.18497955799102783
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,10240,2048,0.23069334030151367
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,10240,1536,0.13636088371276855
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,10240,768,0.04751999841796028
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,10240,1536,0.18904711140526664
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,10240,512,0.03407999873161316
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,10240,1024,0.1259253289964464
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,10240,768,0.10166933139165242
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,10240,256,0.03227644496493869
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,10240,512,0.08702044354544745
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,10240,5120,0.4817608727349176
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,10240,128,0.023766222927305434
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,10240,256,0.06288622485266791
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,10240,256,0.056240889761182994
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,10240,64,0.019318222999572754
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,10240,32,0.019310222731696237
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,10240,128,0.0500311123000251
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,10240,128,0.0514959990978241
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,10240,64,0.05158133308092753
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,10240,32,0.052263110876083374
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,10240,2560,0.2116924391852485
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,10240,1024,0.1021253334151374
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,10240,768,0.08376799689398871
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,10240,512,0.06783822509977552
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,8192,16384,0.7064231236775717
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,8192,51200,2.1847288343641496
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,8192,65536,2.8676071166992188
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,8192,12288,0.5517839855617946
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,8192,16384,1.3519795735677083
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,8192,16384,1.2239768770005968
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,8192,12288,0.9140489366319445
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,8192,12288,0.9991582234700521
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,8192,10240,0.7430319786071777
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,8192,8192,0.3655342260996501
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,8192,10240,0.8382444381713867
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,8192,51200,4.611649831136067
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,8192,8192,0.5911688804626465
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,8192,10240,0.45900265375773114
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,8192,7168,0.3305902216169569
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,8192,6144,0.276104900572035
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,8192,8192,0.7000648710462781
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,8192,7168,0.5323404206169976
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,8192,51200,4.236742231580946
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,8192,7168,0.5875022146436903
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,8192,5120,0.216630220413208
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,8192,65536,5.923739539252387
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,8192,6144,0.4881084230211046
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,8192,4096,0.18188622262742785
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,8192,6144,0.5148408677842882
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,8192,5120,0.3763253423902724
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,8192,3584,0.16256354914771184
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,8192,4096,0.31189245647854275
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,8192,5120,0.43483734130859375
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,8192,4096,0.354111115137736
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,8192,3072,0.13671822018093532
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,8192,65536,5.50077141655816
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,8192,3584,0.25816355811225045
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,8192,3072,0.2247413264380561
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,8192,3584,0.3019813431633843
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,8192,2048,0.0971662203470866
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,8192,3072,0.2625359959072537
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,8192,2560,0.21676977475484213
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,8192,1536,0.07724266582065158
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,8192,1024,0.054309331708484225
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,8192,2048,0.18325066566467285
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,8192,2048,0.15358577834235296
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,8192,1536,0.12003289328681098
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,8192,1536,0.1527973281012641
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,8192,1024,0.09464799695544773
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,8192,1024,0.10985955264833237
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,8192,512,0.03024266825781928
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,8192,768,0.07165333297517565
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,8192,768,0.09540088971455891
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,8192,256,0.021254221598307293
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,8192,512,0.05838221973843045
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,8192,512,0.07570666737026639
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,8192,128,0.01793688866827223
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,8192,256,0.049582223097483315
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,8192,256,0.05537866552670797
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,8192,64,0.015464888678656684
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,8192,32,0.01590844492117564
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,8192,128,0.04419111212094625
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,8192,128,0.043904887305365674
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,8192,64,0.04286311070124308
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,8192,2560,0.11104355255762736
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,8192,32,0.043113778034845986
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,8192,2560,0.23707911703321669
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,8192,768,0.04096711013052199
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,7168,16384,0.6425555547078451
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,7168,16384,1.124251577589247
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,7168,51200,2.2414578331841364
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,7168,12288,0.48901690377129453
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,7168,65536,2.779936048719618
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,7168,16384,1.2639137903849285
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,7168,10240,0.4285324414571126
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,7168,12288,0.8492950863308377
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,7168,10240,0.6850746472676595
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,7168,12288,0.949228392706977
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,7168,8192,0.31037865744696724
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,7168,7168,0.28763998879326713
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,7168,8192,0.5470550855000814
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,7168,10240,0.812156465318468
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,7168,51200,4.226507398817274
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,7168,6144,0.2307466665903727
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,7168,7168,0.5322684182061089
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,7168,5120,0.19451822174919975
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,7168,7168,0.5572906600104438
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,7168,6144,0.42700711886088055
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,7168,51200,3.952545589870877
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,7168,4096,0.15050400627983943
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,7168,6144,0.5222773551940918
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,7168,5120,0.36054666837056476
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,7168,65536,5.433597140842014
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,7168,5120,0.40687910715738934
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,7168,3584,0.1312319967481825
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,7168,4096,0.27782487869262695
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,7168,4096,0.3276488780975342
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,7168,3072,0.12309511502583821
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,7168,8192,0.6314702033996582
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,7168,3584,0.24107556872897676
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,7168,2560,0.1018213364813063
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,7168,3072,0.20747733116149902
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,7168,2048,0.07635911305745442
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,7168,3584,0.31745955679151744
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,7168,3072,0.24752532111273873
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,7168,1536,0.06012800004747179
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,7168,1024,0.04497155547142029
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,7168,2048,0.14096089204152426
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,7168,2048,0.17539821730719674
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,7168,1536,0.11387377315097386
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,7168,1536,0.13817689153883192
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,7168,768,0.03569511241383023
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,7168,512,0.025966222087542217
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,7168,1024,0.10403733121024238
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,7168,768,0.08671200275421143
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,7168,768,0.06679733594258626
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,7168,256,0.019472888774342008
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,7168,512,0.06946311394373576
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,7168,512,0.05390488770272997
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,7168,128,0.016727111405796476
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,7168,256,0.05224800109863281
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,7168,64,0.016120889120631747
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,7168,128,0.038035555018319026
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,7168,32,0.016364443633291457
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,7168,64,0.03748355640305413
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,7168,32,0.0366231103738149
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,7168,2560,0.17197777165306938
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,7168,2560,0.2085813283920288
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,7168,65536,5.08161883884006
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,7168,1024,0.08291555775536431
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,7168,256,0.043261332644356616
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,7168,128,0.04161244299676683
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,6144,16384,0.5421413315667046
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,6144,51200,1.5704711278279622
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,6144,65536,2.2596026526557074
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,6144,12288,0.44106221199035645
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,6144,16384,1.071929825676812
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,6144,10240,0.366504881117079
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,6144,12288,0.7643271022372775
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,6144,16384,1.2108195622762044
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,6144,8192,0.2841457790798611
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,6144,12288,0.9333680470784506
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,6144,10240,0.7508737776014539
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,6144,10240,0.7516240013970269
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,6144,8192,0.5282355414496528
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,6144,7168,0.23665245374043783
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,6144,51200,3.8477350870768228
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,6144,8192,0.6088177892896864
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,6144,6144,0.20537777741750082
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,6144,7168,0.44588979085286456
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,6144,5120,0.176966216829088
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,6144,6144,0.3909280035230849
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,6144,65536,4.7257741292317705
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,6144,7168,0.5403360260857476
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,6144,4096,0.1291173299153646
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,6144,6144,0.4638373586866591
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,6144,51200,3.745787726508247
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,6144,4096,0.2554017702738444
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,6144,5120,0.42470489607916934
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,6144,3072,0.08845422003004287
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,6144,4096,0.31427110566033256
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,6144,3584,0.21836445066663954
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,6144,2560,0.08633955319722493
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,6144,3584,0.2744053204854329
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,6144,3072,0.19599289364284941
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,6144,2048,0.07123021947013007
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,6144,3072,0.23764443397521973
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,6144,2560,0.15910666518741184
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,6144,65536,4.788476308186849
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,6144,1536,0.05462400118509928
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,6144,2560,0.2007217804590861
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,6144,1024,0.03991377684805129
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,6144,2048,0.13259288999769422
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,6144,2048,0.16577066315544978
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,6144,768,0.028510222832361858
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,6144,1536,0.10246755679448445
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,6144,1536,0.13279378414154053
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,6144,1024,0.0765297810236613
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,6144,1024,0.09976177745395237
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,6144,512,0.021409778131379023
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,6144,256,0.01684711045689053
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,6144,768,0.06078222062852648
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,6144,768,0.08433333370420669
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,6144,128,0.014197332991494073
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,6144,512,0.06651644574271308
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,6144,512,0.048531555467181735
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,6144,256,0.04950044552485148
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,6144,256,0.03758222195837233
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,6144,64,0.012030222349696688
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,6144,5120,0.3199226591322157
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,6144,3584,0.11299910810258652
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,6144,32,0.01277511070171992
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,6144,128,0.03537866804334853
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,6144,128,0.0385484430525038
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,6144,64,0.03304622239536709
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,6144,32,0.03253333436118232
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,5120,16384,0.46802579032050234
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,5120,16384,0.9508266448974609
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,5120,51200,1.608639081319173
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,5120,12288,0.3649262322319879
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,5120,65536,1.853560977511936
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,5120,16384,1.1313795513576932
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,5120,10240,0.2972755432128906
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,5120,12288,0.7220586670769585
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,5120,8192,0.22327200571695963
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,5120,10240,0.5792115529378256
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,5120,12288,0.854880862765842
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,5120,7168,0.21753866142696807
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,5120,10240,0.7371022436353895
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,5120,8192,0.4946782324049208
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,5120,8192,0.5713546541002061
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,5120,51200,3.355457729763455
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,5120,6144,0.16379111342959934
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,5120,7168,0.4217102262708876
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,5120,5120,0.1331617832183838
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,5120,7168,0.5054444207085503
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,5120,6144,0.35163288646274143
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,5120,5120,0.3012559943728977
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,5120,4096,0.11721600426567926
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,5120,6144,0.4440915584564209
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,5120,3584,0.10070844491322835
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,5120,51200,3.4939484066433377
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,5120,5120,0.3829475508795844
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,5120,3072,0.08803821934594049
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,5120,4096,0.2317919996049669
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,5120,65536,4.201350318060981
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,5120,4096,0.296341339747111
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,5120,2560,0.06795555353164673
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,5120,3584,0.20125155978732637
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,5120,3584,0.2596302297380236
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,5120,3072,0.17278577221764457
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,5120,2048,0.058816889921824135
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,5120,3072,0.22184267308976915
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,5120,1536,0.04706222150060865
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,5120,2560,0.14453332953982884
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,5120,2560,0.18716266420152453
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,5120,1024,0.032221333848105535
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,5120,2048,0.1194559997982449
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,5120,2048,0.1576746702194214
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,5120,1536,0.12456799878014459
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,5120,768,0.023009777069091797
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,5120,512,0.018008000320858426
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,5120,1024,0.09342755873998006
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,5120,1024,0.06976799832450019
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,5120,768,0.055585775110456676
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,5120,256,0.014161777165200977
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,5120,768,0.07794488800896539
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,5120,512,0.04356088903215197
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,5120,512,0.06237600247065226
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,5120,256,0.04522044459978739
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,5120,65536,4.5219065348307295
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,5120,256,0.03374044431580438
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,5120,64,0.013405332962671915
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,5120,32,0.012749333348539142
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,5120,128,0.03044355577892727
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,5120,64,0.03018666638268365
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,5120,32,0.02949955397182041
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,5120,1536,0.0939448873202006
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,5120,128,0.014744000302420722
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,4096,51200,1.0608897738986545
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,5120,128,0.03598755598068237
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,4096,65536,1.4396817949083116
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,4096,16384,0.37202755610148114
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,4096,12288,0.2839333216349284
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,4096,16384,0.8610053592258029
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,4096,12288,0.6591946813795302
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,4096,16384,1.0522178014119465
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,4096,10240,0.22704267501831055
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,4096,12288,0.8098630905151367
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,4096,8192,0.1870675616794162
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,4096,10240,0.5244684219360352
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,4096,7168,0.15938222408294678
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,4096,8192,0.4317733446756999
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,4096,10240,0.662609789106581
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,4096,8192,0.5793502065870497
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,4096,6144,0.1416862275865343
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,4096,7168,0.37119377983940977
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,4096,51200,2.9466150071885853
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,4096,5120,0.1095857752694024
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,4096,65536,3.6458863152398
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,4096,7168,0.4746524492899577
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,4096,6144,0.3238382339477539
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,4096,4096,0.08852266603045994
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,4096,6144,0.40945688883463544
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,4096,3584,0.07741777764426337
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,4096,5120,0.2761724525027805
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,4096,5120,0.34409512413872617
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,4096,3072,0.0649048884709676
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,4096,4096,0.20997333526611328
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,4096,4096,0.27488356166415745
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,4096,3584,0.1824737787246704
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,4096,3584,0.24109511905246309
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,4096,3072,0.15522755516899958
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,4096,51200,3.240489747789171
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,4096,3072,0.20873955885569254
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,4096,2048,0.046794666184319385
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,4096,1536,0.03575999869240655
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,4096,2560,0.13065511650509304
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,4096,2560,0.17515022224850127
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,4096,1024,0.02437777817249298
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,4096,2048,0.1067804429266188
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,4096,2048,0.1450444459915161
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,4096,1536,0.08558044168684219
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,4096,1536,0.11722577942742242
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,4096,768,0.019627556204795837
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,4096,65536,4.156576792399089
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,4096,512,0.015080889066060385
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,4096,1024,0.06219644678963555
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,4096,1024,0.08727733294169109
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,4096,256,0.01186222251918581
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,4096,768,0.07307644685109456
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,4096,128,0.011015111373530494
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,4096,512,0.0377475553088718
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,4096,512,0.057971556981404625
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,4096,256,0.029230223761664495
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,4096,256,0.04316888915167915
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,4096,64,0.009336888790130615
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,4096,32,0.00977955593003167
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,4096,128,0.026779555612140234
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,4096,64,0.025734222597546045
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,4096,32,0.02581688927279578
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,4096,2560,0.050887998607423574
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,4096,768,0.04945955673853556
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,3584,51200,1.1642355389065213
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,3584,65536,1.346236440870497
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,4096,128,0.03296355406443278
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,3584,16384,0.3355333275265164
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,3584,12288,0.2636551062266032
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,3584,16384,0.9495759540134006
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,3584,16384,1.018839094373915
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,3584,12288,0.6264799965752496
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,3584,10240,0.23379911316765678
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,3584,51200,2.6383465660942926
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,3584,8192,0.17343110508388945
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,3584,10240,0.5008106761508518
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,3584,12288,0.7627200020684136
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,3584,7168,0.15503999922010633
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,3584,8192,0.4017359945509169
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,3584,65536,3.418047163221571
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,3584,6144,0.12135822243160671
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,3584,10240,0.6511804262797037
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,3584,7168,0.35328088866339785
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,3584,8192,0.5211502181159126
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,3584,5120,0.11178844504886204
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,3584,4096,0.08537066645092434
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,3584,51200,3.120285246107313
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,3584,6144,0.30386310153537327
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,3584,7168,0.4541341993543837
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,3584,5120,0.2538115448421902
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,3584,6144,0.3934924337599013
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,3584,3584,0.08062044117185804
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,3584,5120,0.3324311044481066
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,3584,3072,0.06843022505442302
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,3584,4096,0.2004835605621338
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,3584,3584,0.17341600524054634
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,3584,2560,0.052694221337636314
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,3584,4096,0.26388978958129883
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,3584,3072,0.14729421668582493
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,3584,3584,0.23167644606696236
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,3584,1536,0.03489955597453647
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,3584,3072,0.19951377974616158
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,3584,2560,0.123508440123664
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,3584,65536,3.9917831420898438
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,3584,2560,0.167921781539917
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,3584,1024,0.0219217770629459
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,3584,2048,0.14058666759067112
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,3584,768,0.018301332990328472
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,3584,1536,0.080622222688463
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,3584,1536,0.11220444573296441
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,3584,1024,0.08435822195476955
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,3584,1024,0.05840088923772176
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,3584,512,0.016027554869651794
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,3584,768,0.07031999693976508
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,3584,768,0.0461751123269399
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,3584,256,0.012715555727481842
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,3584,128,0.010673777924643623
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,3584,512,0.054634667105144925
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,3584,512,0.03605422377586365
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,3584,256,0.027458666099442378
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,3584,64,0.008963555925422246
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,3584,256,0.040185779333114624
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,3584,128,0.02502222193611993
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,3584,128,0.032574223147498235
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,3584,32,0.009335111412737105
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,3584,64,0.024345777100986902
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,3584,32,0.023941333095232647
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,3584,2048,0.04381600022315979
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,3584,2048,0.10119822290208604
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,3072,16384,0.2641173203786214
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,3072,51200,0.8976977666219076
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,3072,65536,1.0679492950439453
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,3072,12288,0.2446355554792616
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,3072,16384,0.744958241780599
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,3072,12288,0.6154213481479222
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,3072,10240,0.17025155491299102
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,3072,16384,0.9725155300564237
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,3072,8192,0.14536000622643366
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,3072,12288,0.8438160154554578
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,3072,10240,0.4748524559868707
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,3072,7168,0.12097067303127712
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,3072,10240,0.6658666928609213
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,3072,51200,2.4481146070692277
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,3072,8192,0.3805253240797255
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,3072,6144,0.10114666488435532
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,3072,8192,0.5018729103936089
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,3072,7168,0.33471377690633136
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,3072,5120,0.09230844179789226
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,3072,6144,0.28829065958658856
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,3072,7168,0.439683543311225
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,3072,4096,0.07071733474731445
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,3072,65536,3.1376079983181424
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,3072,6144,0.3789217736985948
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,3072,5120,0.24041777186923555
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,3072,3584,0.053278221024407275
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,3072,5120,0.32007021374172634
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,3072,3072,0.052984890010621816
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,3072,4096,0.19059467315673828
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,3072,4096,0.2541217803955078
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,3072,2560,0.046463999483320445
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,3072,3584,0.1649671130710178
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,3072,3584,0.22235467698838976
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,3072,2048,0.03618844350179037
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,3072,3072,0.1401102277967665
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,3072,3072,0.19203733073340523
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,3072,1536,0.027449778384632532
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,3072,2560,0.11699733469221328
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,3072,2560,0.16266844007703993
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,3072,2048,0.13493422667185465
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,3072,1024,0.01974933346112569
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,3072,1536,0.07412177986568876
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,3072,1536,0.10730044709311591
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,3072,768,0.015740444262822468
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,3072,1024,0.08051377534866333
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,3072,1024,0.05472177929348416
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,3072,512,0.01236177815331353
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,3072,65536,3.8349893358018665
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,3072,768,0.06806577576531304
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,3072,256,0.009658666948477427
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,3072,512,0.03344088792800903
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,3072,128,0.008750222623348236
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,3072,256,0.02574399941497379
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,3072,256,0.0399582220448388
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,3072,64,0.00793333351612091
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,3072,128,0.023099554909600153
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,3072,128,0.03154044349988302
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,3072,51200,2.99198489718967
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,3072,64,0.022288888692855835
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,3072,32,0.022280888424979314
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,3072,2048,0.09672177500194973
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,3072,768,0.04275644487804837
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,3072,512,0.052347554100884326
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,2560,65536,1.081573380364312
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,2560,16384,0.25171200434366864
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,3072,32,0.00867555538813273
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,2560,51200,0.7883049117194282
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,2560,12288,0.18140444490644667
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,2560,16384,0.7514710956149631
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,2560,12288,0.6003582212660048
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,2560,10240,0.15032000011867946
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,2560,16384,0.9364088906182183
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,2560,12288,0.7051919831169976
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,2560,8192,0.13725599977705213
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,2560,10240,0.4501315752665202
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,2560,7168,0.11400266488393147
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,2560,8192,0.35969066619873047
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,2560,10240,0.5925111240810818
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,2560,51200,2.2872897254096136
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,2560,6144,0.09635733233557807
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,2560,65536,2.92268795437283
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,2560,8192,0.4899804327223036
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,2560,7168,0.3175120088789198
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,2560,5120,0.07527733511394925
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,2560,4096,0.06202310985989041
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,2560,7168,0.4211111068725586
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,2560,6144,0.2732711103227404
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,2560,5120,0.22826043764750162
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,2560,6144,0.36442134115431046
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,2560,3584,0.056927998860677086
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,2560,5120,0.3068293465508355
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,2560,3072,0.04868622289763557
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,2560,4096,0.24467288123236763
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,2560,3584,0.1565262211693658
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,2560,2560,0.04156000084347195
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,2560,3584,0.21356444888644746
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,2560,3072,0.1323875586191813
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,2560,2048,0.034458667039871216
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,2560,3072,0.18404622872670492
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,2560,51200,2.872112062242296
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,2560,1536,0.027628444963031348
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,2560,2560,0.11043110820982192
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,2560,2560,0.15579999817742243
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,2560,1024,0.016881777180565726
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,2560,2048,0.09102577633327907
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,2560,2048,0.1298933294084337
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,2560,768,0.014153778553009033
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,2560,1536,0.06935822301440768
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,2560,1536,0.10314310921563043
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,2560,1024,0.07750133011076185
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,2560,512,0.011752888560295105
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,2560,256,0.00904088881280687
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,2560,768,0.04010666741265191
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,2560,768,0.0653911100493537
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,2560,512,0.031164444155163232
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,2560,128,0.007947555846638149
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,2560,512,0.051615112357669406
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,2560,256,0.03871999846564399
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,2560,128,0.030421333180533514
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,2560,128,0.02146222194035848
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,2560,32,0.009310222334331935
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,2560,64,0.020596444606781006
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,2560,32,0.02034311162100898
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,2560,4096,0.1806968847910563
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,2048,65536,0.6588960223727757
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,2048,51200,0.5381306542290581
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,2560,65536,3.6730558607313366
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,2560,1024,0.051217777861489185
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,2048,16384,0.17904444535573324
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,2560,64,0.007233777807818518
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,2048,12288,0.13527466191185847
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,2048,16384,0.6632764604356554
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,2048,12288,0.5007368723551432
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,2048,10240,0.11575555801391602
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,2560,256,0.023801777097913954
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,2048,10240,0.41986666785346133
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,2048,8192,0.09237422545750935
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,2048,65536,2.678056081136068
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,2048,51200,2.1043084462483725
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,2048,10240,0.5678364435831705
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,2048,8192,0.3388693332672119
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,2048,7168,0.08398755391438802
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,2048,16384,0.893190171983507
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,2048,6144,0.07042133145862155
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,2048,8192,0.4586186408996582
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,2048,7168,0.29836977852715385
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,2048,5120,0.056299553977118603
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,2048,12288,0.6763280232747396
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,2048,7168,0.40439555380079484
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,2048,6144,0.25740710894266766
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,2048,4096,0.044277333550983004
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,2048,65536,3.4925439622667103
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,2048,5120,0.21488532755109999
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,2048,6144,0.34925421078999835
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,2048,3584,0.03941422369745042
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,2048,5120,0.2949919965532091
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,2048,4096,0.16992178228166369
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,2048,3072,0.03369333346684774
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,2048,4096,0.23460178905063203
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,2048,2560,0.029263999727037217
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,2048,3584,0.14662044578128391
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,2048,3584,0.20505332946777344
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,2048,2048,0.024849777420361836
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,2048,3072,0.12436710463629828
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,2048,2560,0.10373600323994954
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,2048,1536,0.01959022217326694
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,2048,2048,0.08507111337449814
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,2048,2048,0.12487644619411892
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,2048,1024,0.014098667436175875
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,2048,1536,0.09895200199551052
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,2048,1536,0.06515466504626803
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,2048,768,0.012141333685980903
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,2048,1024,0.04559377829233805
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,2048,1024,0.0737173358599345
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,2048,512,0.009336888790130615
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,2048,768,0.03781333234575059
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,2048,256,0.007280000381999546
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,2048,512,0.02905155552758111
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,2048,512,0.04798577891455757
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,2048,51200,2.739953782823351
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,2048,128,0.006607111129495833
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,2048,256,0.022307554880777996
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,2048,64,0.00600000015563435
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,2048,256,0.03608444333076477
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,2048,32,0.006618666566080517
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,2048,128,0.01955200069480472
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,2048,64,0.018937778141763475
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,2048,32,0.018882667024930317
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,2048,3072,0.17682488759358725
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,2048,2560,0.1496115525563558
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,1536,65536,0.5455742412143284
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,1536,51200,0.42708622084723574
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,1536,16384,0.13690400123596191
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,2048,768,0.062257779969109424
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,1536,12288,0.10293955273098415
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,2048,128,0.02942044536272685
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,1536,16384,0.6791031095716688
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,1536,10240,0.09336088763342963
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,1536,12288,0.47133779525756836
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,1536,16384,0.8782124519348145
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,1536,8192,0.07748711109161377
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,1536,10240,0.3976142141554091
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,1536,12288,0.6464231279161241
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,1536,7168,0.06643111175960965
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,1536,10240,0.5430311097039117
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,1536,8192,0.3206453323364258
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,1536,51200,1.9625769721137152
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,1536,6144,0.05859111415015327
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,1536,7168,0.28194578488667804
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,1536,65536,2.507965299818251
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,1536,5120,0.04389333393838671
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,1536,7168,0.386784897910224
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,1536,6144,0.24290755059983996
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,1536,4096,0.034274667501449585
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,1536,6144,0.3349768850538466
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,1536,3584,0.0317191117339664
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,1536,5120,0.20359555880228677
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,1536,5120,0.2815439965989855
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,1536,3072,0.02754577828778161
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,1536,4096,0.16147111521826849
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,1536,4096,0.22464177343580458
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,1536,2560,0.02346399923165639
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,1536,3584,0.1395217842525906
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,1536,51200,2.615974214341905
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,1536,3584,0.19611999723646376
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,1536,2048,0.019714666737450492
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,1536,3072,0.11726400587293838
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,1536,3072,0.16844533549414742
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,1536,1536,0.015288889408111572
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,1536,2560,0.09814844528834026
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,1536,2560,0.14284000131818983
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,1536,2048,0.08005688587824504
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,1536,1024,0.011529777612951068
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,1536,2048,0.11896355946858723
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,1536,768,0.009662222531106737
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,1536,1536,0.09516177574793498
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,1536,512,0.00792711145348019
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,1536,65536,3.3429031372070312
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,1536,1024,0.07083911365932889
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,1536,768,0.034520887666278414
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,1536,768,0.05789866712358263
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,1536,8192,0.43869688775804305
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,1536,512,0.027444443768925134
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,1536,512,0.04726577798525492
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,1536,128,0.005587555468082428
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,1536,256,0.020635555187861126
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,1536,256,0.03530222177505493
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,1536,64,0.0053671110007498
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,1536,32,0.005230222311284807
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,1536,128,0.017841777867741056
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,1536,128,0.02832888894610935
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,1536,64,0.017543110582563613
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,1536,32,0.017511111166742113
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,1024,65536,0.3659359878963894
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,1024,51200,0.28477599885728627
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,1536,1536,0.06283911069234212
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,1536,1024,0.043154666821161904
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,1024,16384,0.0932568907737732
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,1536,256,0.006230222268237009
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,1024,12288,0.07237066825230916
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,1024,16384,0.5866506894429525
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,1024,12288,0.44334843423631454
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,1024,10240,0.0606479975912306
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,1024,16384,0.8166524569193522
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,1024,12288,0.6191235648261176
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,1024,8192,0.051798221137788564
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,1024,10240,0.37186400095621747
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,1024,7168,0.040744000011020236
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,1024,8192,0.3000560071733263
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,1024,10240,0.518812444474962
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,1024,51200,1.8164772457546656
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,1024,6144,0.03586666782697042
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,1024,65536,2.3112515343560114
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,1024,8192,0.4198124408721924
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,1024,5120,0.030272887812720403
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,1024,7168,0.2641208966573079
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,1024,4096,0.02432800001568264
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,1024,6144,0.2280977831946479
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,1024,7168,0.37029245164659286
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,1024,5120,0.1907635529836019
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,1024,6144,0.320126215616862
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,1024,3584,0.02272622287273407
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,1024,5120,0.26926665835910374
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,1024,3072,0.019295111298561096
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,1024,4096,0.1504462162653605
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,1024,4096,0.2150355577468872
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,1024,2560,0.016869333055284288
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,1024,3584,0.13050044907463923
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,1024,3584,0.18731289439731172
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,1024,3072,0.10920800103081597
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,1024,2048,0.014548444085650973
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,1024,3072,0.1610328886244032
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,1024,1536,0.011800888511869641
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,1024,2560,0.09151111046473186
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,1024,1024,0.009371555513805812
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,1024,2048,0.07459288835525513
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,1024,2048,0.1127857764561971
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,1024,1536,0.05731199847327339
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,1024,1536,0.09052177932527329
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,1024,768,0.007999999655617608
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,1024,65536,3.1923885345458984
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,1024,512,0.006595555692911148
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,1024,1024,0.0399617784553104
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,1024,1024,0.06567022535536024
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,1024,256,0.0053297777970631914
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,1024,768,0.05544799897405836
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,1024,512,0.044172445933024086
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,1024,512,0.025363556212849084
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,1024,256,0.03337422344419692
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,1024,256,0.018886221779717337
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,1024,64,0.004515555583768421
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,1024,32,0.004512888689835866
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,1024,128,0.016350222958458793
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,1024,128,0.026605332891146343
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,1024,64,0.015471999843915304
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,1024,32,0.015125332607163323
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,768,65536,0.2989768981933594
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,768,51200,0.23345510164896646
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,1024,51200,2.4989679124620223
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,1024,2560,0.13662400510576037
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,768,16384,0.07579911417431302
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,1024,768,0.031903998719321355
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,1024,128,0.004836444639497333
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,768,12288,0.057088891665140785
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,768,16384,0.5661830902099609
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,768,10240,0.04871288935343424
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,768,16384,0.813061343299018
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,768,12288,0.4282737837897406
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,768,8192,0.03862488932079739
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,768,12288,0.6165768835279677
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,768,10240,0.35889511638217503
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,768,7168,0.03231911195649041
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,768,8192,0.29029154777526855
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,768,51200,1.7458648681640625
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,768,10240,0.5166115760803223
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,768,6144,0.027913779020309448
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,768,7168,0.25508801142374676
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,768,65536,2.2273875342475042
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,768,8192,0.4180764357248942
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,768,5120,0.023755555351575215
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,768,7168,0.368064006169637
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,768,6144,0.21997333897484672
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,768,4096,0.019309333629078336
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,768,6144,0.3185093402862549
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,768,3584,0.017633777525689866
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,768,5120,0.26885422070821124
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,768,4096,0.14553244908650717
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,768,3072,0.015631111131774057
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,768,4096,0.21319111188252768
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,768,3584,0.1256506707933214
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,768,2560,0.01352533366945055
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,768,3584,0.18630488713582358
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,768,51200,2.495008044772678
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,768,2048,0.011728000309732227
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,768,3072,0.1054346693886651
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,768,3072,0.16062933868832058
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,768,1536,0.009704888694816166
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,768,2560,0.08771289057201809
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,768,2560,0.13571733898586696
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,768,1024,0.007855110698276097
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,768,2048,0.07195999887254503
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,768,2048,0.11296178234948052
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,768,65536,3.1828844282362194
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,768,768,0.006777777853939269
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,768,1536,0.05489066574308607
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,768,1536,0.09033955468071832
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,768,512,0.005838222387764189
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,768,1024,0.06560533576541476
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,768,768,0.055175999800364174
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,768,256,0.004872888740566042
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,768,768,0.030877331892649334
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,768,512,0.04391910963588291
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,768,512,0.024336000283559162
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,768,128,0.004523555437723796
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,768,64,0.0041759999261962045
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,768,256,0.03290311164326138
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,768,256,0.01791200041770935
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,768,32,0.004212444441186057
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,768,128,0.02641333308484819
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,768,128,0.015635554989178974
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,768,5120,0.184005339940389
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,768,64,0.01479022204875946
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,768,32,0.01477777792347802
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,512,65536,0.21785777144961885
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,512,51200,0.1671146684222751
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,512,16384,0.05455288953251309
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,512,16384,0.5453271336025661
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,512,12288,0.041159109936820135
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,768,1024,0.03787111242612203
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,512,10240,0.0374017788304223
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,512,16384,0.7856222258673774
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,512,12288,0.41161423259311253
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,512,10240,0.34529688623216415
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,512,8192,0.027601778507232666
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,512,12288,0.5888240072462294
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,512,7168,0.022290666898091633
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,512,10240,0.4950426419576009
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,512,51200,1.6783271365695531
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,512,6144,0.019380443625979953
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,512,8192,0.27948088116115993
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,512,8192,0.39934576882256406
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,512,5120,0.01738222274515364
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,512,7168,0.35243911213344997
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,512,6144,0.21193510956234404
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,512,4096,0.014083556003040738
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,512,6144,0.30471645461188424
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,512,5120,0.1775733364952935
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,512,3584,0.012774222426944308
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,512,5120,0.257081773546007
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,512,4096,0.14012000295850965
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,512,51200,2.374880048963759
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,512,4096,0.20441688431633842
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,512,3584,0.12081333001454671
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,512,2560,0.010087110930018956
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,512,3584,0.17821244398752847
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,512,3072,0.10117689106199478
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,512,3072,0.15284355481465658
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,512,2048,0.008933333059151968
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,512,2560,0.0837635530365838
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,512,2560,0.1294133398267958
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,512,65536,3.034510294596354
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,512,2048,0.10788977808422512
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,512,1024,0.005959110955397288
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,512,1536,0.05140622125731575
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,512,7168,0.24595999717712402
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,512,1536,0.08611377742555405
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,512,768,0.0052764444715446895
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,512,65536,2.1449574364556208
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,512,1024,0.036306666003333196
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,512,1024,0.06195466385947334
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,512,512,0.004619555754794015
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,512,768,0.05269777774810791
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,512,768,0.02947910957866245
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,512,512,0.04225777917438083
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,512,512,0.02330844435426924
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,512,128,0.0038515557017591265
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,512,256,0.03156355685657925
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,512,256,0.01720888912677765
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,512,64,0.003504000190231535
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,512,128,0.024891555309295654
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,512,128,0.01479288935661316
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,512,3072,0.011260444091426002
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,512,32,0.0036275556517971885
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,512,64,0.01407999959256914
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,512,32,0.013793778088357715
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,256,65536,0.15017599529690212
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,256,51200,0.11270044909583198
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,512,1536,0.007689778175618913
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,256,16384,0.036304887798097395
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,512,2048,0.06863022512859769
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,512,256,0.004226666771703296
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,256,12288,0.027424888478385076
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,256,16384,0.5246755811903212
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,256,16384,0.7709964646233453
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,256,10240,0.022843556271659002
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,256,12288,0.3970497714148627
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,256,8192,0.01681866745154063
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,256,12288,0.5853110949198405
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,256,51200,1.6125475565592449
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,256,10240,0.33316532770792645
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,256,7168,0.014428445034556918
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,256,8192,0.2691475550333659
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,256,10240,0.4904986487494574
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,256,65536,2.062538570827908
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,256,7168,0.23625421524047852
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,256,8192,0.39678488837348086
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,256,5120,0.011005333728260465
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,256,7168,0.3495937718285455
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,256,6144,0.2038053274154663
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,256,4096,0.009352000223265754
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,256,6144,0.302877320183648
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,256,5120,0.17104000515407988
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,256,3584,0.008960888617568547
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,256,5120,0.25502488348219127
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,256,3072,0.00777333312564426
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,256,4096,0.13506044281853571
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,256,51200,2.3587883843315973
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,256,4096,0.2036177714665731
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,256,2560,0.007274666594134436
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,256,3584,0.11607200569576687
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,256,3584,0.17694666650560167
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,256,2048,0.006586666736337874
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,256,3072,0.09689333041508992
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,256,1536,0.00554666668176651
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,256,3072,0.152218672964308
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,256,2560,0.08003555403815375
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,256,2560,0.12825066513485378
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,256,1024,0.004868444469239977
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,256,2048,0.06556355290942721
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,256,2048,0.10659911235173543
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,256,768,0.004545777622196409
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,256,65536,3.0147599114312063
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,256,1536,0.08496977885564168
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,256,1024,0.033944000800450645
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,256,1024,0.06208533048629761
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,256,512,0.0038293335172865125
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,256,256,0.0035706667436493766
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,256,768,0.0280728903081682
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,256,768,0.05232266585032145
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,256,6144,0.012504888905419244
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,256,128,0.003481777591837777
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,256,64,0.003176888864901331
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,256,512,0.04159911142455207
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,256,256,0.031275557147132024
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,256,32,0.0032071111102898917
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,256,128,0.024600888291994732
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,256,128,0.013461333182122974
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,256,64,0.01293777757220798
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,128,65536,0.09675111373265584
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,256,32,0.012784000072214337
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,128,51200,0.07803555329640706
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,128,16384,0.031162665949927434
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,128,16384,0.5151324272155762
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,256,1536,0.04957333207130432
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,128,12288,0.022443556123309668
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,256,512,0.022341334157519873
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,256,256,0.016185777054892648
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,128,10240,0.016297777493794758
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,128,12288,0.38900089263916016
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,128,10240,0.32675109969245064
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,128,16384,0.7697671254475912
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,128,51200,1.578703138563368
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,128,8192,0.013774221969975365
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,128,7168,0.012274666792816587
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,128,65536,2.0229085286458335
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,128,10240,0.48939911524454754
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,128,8192,0.26331912146674263
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,128,6144,0.010571555958853828
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,128,7168,0.23231999079386392
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,128,5120,0.009480888644854227
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,128,8192,0.3953191174401178
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,128,6144,0.19985422823164198
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,128,5120,0.1672977738910251
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,128,6144,0.3019377655453152
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,128,7168,0.349089781443278
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,128,5120,0.254584895239936
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,128,4096,0.13227466742197672
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,128,4096,0.20208356115553114
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,128,3584,0.1131697760687934
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,128,3072,0.006928000185224745
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,128,65536,3.0119334326850047
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,128,12288,0.5827706654866537
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,128,2560,0.006430222342411677
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,128,3584,0.1764835516611735
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,128,3072,0.09519733322991265
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,128,2048,0.005385777602593104
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,128,3072,0.1513777838812934
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,128,2560,0.07897422048780653
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,128,2560,0.12792710463205972
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,128,1536,0.005094222310516569
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,128,2048,0.06390844451056586
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,128,2048,0.10613066620296902
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,128,1024,0.004201777693298128
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,128,1536,0.0849306649631924
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,128,1536,0.047925333182017006
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,128,768,0.003887999802827835
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,128,4096,0.008007999923494127
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,128,1024,0.062084443039364286
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,128,51200,2.355091518825955
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,128,512,0.0035457776652442086
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,128,768,0.02752444479200575
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,128,256,0.0032186667538351486
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,128,512,0.021727111604478624
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,128,256,0.030346665117475722
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,128,128,0.0028906667398081887
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,128,256,0.01574222246805827
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,128,64,0.0028284444577164124
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,128,128,0.024482667446136475
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,128,128,0.012865777644846173
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,128,32,0.003168888803985384
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,128,64,0.01238933371173011
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,64,65536,0.09151289198133682
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,128,32,0.01218311074707243
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,64,51200,0.074526223871443
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,64,16384,0.030644443300035264
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,64,12288,0.02365066607793172
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,64,16384,0.5147324668036567
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,128,1024,0.0331582228342692
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,64,10240,0.019034667147530448
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,128,768,0.05188444587919447
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,128,3584,0.0075839997993575195
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,64,8192,0.013332444760534497
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,64,7168,0.011745777395036487
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,64,6144,0.010676444404655032
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4352,128,512,0.04077600108252631
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,64,5120,0.009310222334331935
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,64,8192,0.26311998897128636
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,64,7168,0.2314008871714274
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,64,4096,0.008011555506123437
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,64,6144,0.1994017759958903
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,64,3584,0.007287110719415877
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,64,5120,0.16697422663370767
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,64,3072,0.006950221955776215
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,64,2560,0.005928888916969299
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,64,4096,0.13138222694396973
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,64,2048,0.0057857777509424425
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,64,3584,0.11298133267296685
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,64,3072,0.0943031112353007
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,64,1536,0.004861333303981357
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,64,1024,0.0041617775956789655
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,64,2560,0.07846577962239583
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,64,768,0.003980444537268745
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,64,51200,1.5781235165066188
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,64,2048,0.06386044290330675
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,64,512,0.0035137778355015647
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,64,1536,0.047188444270028
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,64,256,0.0032017777363459268
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,64,1024,0.032552000549104475
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,64,128,0.0028986665937635633
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,64,768,0.027425777581002977
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,64,64,0.002871111035346985
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,64,32,0.0028897778441508612
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,64,512,0.021606221795082092
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,64,12288,0.38869865735371906
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,64,128,0.012702222499582501
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,64,65536,2.020680957370334
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,64,64,0.012460444536474017
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,64,32,0.01239111108912362
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,32,16384,0.027892443868849013
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,32,12288,0.021336888273557026
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,32,51200,0.07635288768344455
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,32,10240,0.012803555362754397
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,64,10240,0.3262755605909559
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,32,8192,0.010703999963071613
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,32,12288,0.3887946605682373
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,32,16384,0.51473511589898
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,32,7168,0.010079999764760336
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,32,10240,0.3258231216006809
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,32,8192,0.2635013262430827
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,32,5120,0.008981333010726506
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,32,7168,0.23146398862202963
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,32,4096,0.007673777639865875
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,32,6144,0.1991137795978122
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,32,3584,0.007646222081449296
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,32,5120,0.16698488924238417
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,64,256,0.015463999576038785
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,32,3072,0.012048000262843238
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,32,2560,0.010506666368908353
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,32,4096,0.13176000118255615
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,32,65536,0.0952026645342509
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,32,3584,0.11373066902160645
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,32,2048,0.0052684446175893145
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,32,1536,0.004561777744028303
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,32,3072,0.0951804452472263
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,32,1024,0.0041653331783082755
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,32,2560,0.07881600326961942
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,32,2048,0.06357422139909533
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,32,768,0.003563555578390757
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,32,1536,0.04713333315319485
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,32,51200,1.5811413658989801
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,32,1024,0.0337119996547699
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,32,256,0.0031644445326593188
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,32,128,0.0028124445428450904
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,32,768,0.027112889620992873
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,32,512,0.021606221795082092
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,32,64,0.0028008888992998335
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,32,256,0.015456888410780164
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,32,32,0.002942222274012036
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,32,128,0.012787555654843649
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,32,65536,2.020234637790256
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,32,64,0.012416889270146688
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4352,32,32,0.012048888537618848
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,32,512,0.003547555456558863
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4352,32,6144,0.009335999687512716
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,65536,12288,4.0138498942057295
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,65536,10240,3.4479832119411893
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,65536,16384,5.4313447740342875
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,65536,12288,4.4108602735731335
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,65536,10240,3.6902025010850696
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,65536,16384,6.279368082682292
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,65536,8192,2.8644977145724826
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,65536,6144,2.112725363837348
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,65536,7168,2.3349937862820096
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,65536,8192,2.7939927842881946
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,65536,7168,2.4204213884141708
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,65536,5120,1.6704852845933702
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,65536,4096,1.286527951558431
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,65536,4096,1.3805066214667425
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,65536,5120,1.7442702187432184
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,65536,6144,2.18121337890625
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,65536,3072,0.966111077202691
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,65536,3584,1.222273826599121
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,65536,3584,1.1293431388007271
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,65536,3072,1.0333769056532118
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,65536,2560,0.7703448931376139
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,65536,2048,0.6820355521308051
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,65536,1024,0.3411280049218072
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,65536,2560,0.8731786410013834
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,65536,1536,0.4849573241339789
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,65536,2048,0.7255119747585721
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,65536,1536,0.566880914900038
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,65536,768,0.2978657881418864
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,65536,256,0.14098666773902044
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,65536,768,0.3420613341861301
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,65536,512,0.2831946743859185
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,65536,128,0.12019556098514134
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,65536,1024,0.5123946401807997
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,65536,256,0.29446400536431205
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,65536,64,0.10474310980902778
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,65536,32,0.12118666701846653
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,65536,128,0.2367475562625461
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,65536,64,0.24088711208767363
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,65536,32,0.27225510279337567
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,65536,512,0.20406933625539145
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,51200,16384,4.121343824598524
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,65536,51200,16.73409695095486
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,51200,16384,4.947759840223524
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,51200,12288,3.2374106513129344
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,51200,10240,2.7709990607367625
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,51200,12288,3.5966008504231772
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,51200,10240,2.944975111219618
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,51200,8192,2.229514651828342
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,51200,8192,2.2816569010416665
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,51200,7168,1.942527135213216
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,51200,51200,12.988575405544706
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,51200,6144,1.7218142615424261
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,51200,7168,1.9417165120442708
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,65536,51200,25.789813571506077
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,51200,4096,0.9709510803222656
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,51200,5120,1.2191378275553386
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,51200,6144,1.6953244739108617
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,51200,5120,1.445271068149143
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,51200,3584,0.9143270916408963
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,51200,4096,1.1077164543999565
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,51200,3072,0.8094711303710938
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,51200,3072,0.8252008756001791
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,51200,2560,0.6630053520202637
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,51200,3584,1.0420133802625868
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,51200,2048,0.5480720202128092
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,51200,2560,0.6999057663811578
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,51200,1536,0.41847732332017684
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,51200,1536,0.4521724383036296
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,51200,2048,0.5760889053344727
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,51200,1024,0.2999662293328179
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,51200,768,0.21972889370388457
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,51200,512,0.154384003745185
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,51200,1024,0.3383804427252875
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,51200,65536,16.754772610134548
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,51200,256,0.12836621867285833
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,51200,768,0.26731377177768284
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,51200,512,0.2560373412238227
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,51200,128,0.09472355577680801
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,51200,64,0.08266044325298734
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,51200,256,0.1985128853056166
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,51200,32,0.08732000324461196
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,51200,64,0.2031608952416314
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,51200,32,0.1951520045598348
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,51200,128,0.19234044022030303
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,16384,16384,1.3132435480753581
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,51200,51200,20.044138590494793
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,16384,16384,1.8750567966037328
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,16384,12288,1.019709375169542
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,16384,51200,4.151151021321614
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,16384,10240,0.7828497886657715
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,16384,12288,1.3588568369547527
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,16384,8192,0.7059884601169162
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,16384,10240,1.164031982421875
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,16384,65536,5.324103885226779
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,16384,7168,0.5968497594197592
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,16384,8192,0.9123421774970161
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,16384,6144,0.4829395612080892
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,16384,5120,0.48781601587931317
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,16384,4096,0.3715297645992703
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,16384,6144,0.6945164468553332
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,16384,7168,0.9575102064344617
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,16384,5120,0.5484026802910699
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,16384,3584,0.3018977906968859
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,16384,3072,0.24346044328477648
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,16384,4096,0.54239469104343
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,16384,3584,0.38335733943515354
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,16384,3072,0.32365867826673717
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,16384,2048,0.16395644346872965
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,16384,2560,0.278510226143731
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,16384,1536,0.11405866675906712
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,16384,2048,0.22619732220967612
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,16384,1024,0.09130489163928562
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,16384,1536,0.18341067102220324
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,16384,768,0.07156355513466729
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,16384,512,0.05416799916161431
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,16384,1024,0.1338533295525445
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,16384,768,0.10989777909384833
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,16384,256,0.038450668255488075
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,16384,512,0.08853066629833645
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,16384,128,0.03295733200179206
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,16384,256,0.07563289006551106
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,16384,64,0.02840977907180786
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,16384,128,0.07066577672958374
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,16384,32,0.030074665943781536
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,16384,64,0.07286577754550509
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,16384,32,0.07320711347791883
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,16384,2560,0.22443821695115831
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,16384,51200,7.988389756944444
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,12288,16384,0.9854631423950195
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,12288,12288,0.7874071333143445
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,12288,16384,1.5552523930867512
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,16384,65536,9.948589748806423
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,12288,10240,0.6394373575846354
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,51200,65536,28.20528496636285
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,12288,51200,3.1616418626573353
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,12288,10240,0.9298381805419922
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,12288,12288,1.1215502421061199
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,12288,8192,0.5801066822475857
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,12288,7168,0.48066669040256077
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,12288,65536,3.865764617919922
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,12288,6144,0.38915467262268066
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,12288,8192,0.7445573276943631
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,12288,7168,0.6304302215576172
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,12288,5120,0.3592417769961887
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,12288,4096,0.29389066166347927
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,12288,6144,0.6083137724134657
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,12288,3584,0.2216071155336168
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,12288,3072,0.21657244364420572
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,12288,5120,0.4775359895494249
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,12288,4096,0.357826656765408
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,12288,2560,0.16876888275146484
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,12288,3072,0.27315645747714573
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,12288,3584,0.39242667622036403
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,12288,2048,0.1447297732035319
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,12288,1536,0.10110933250851101
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,12288,1024,0.0784355534447564
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,12288,2048,0.1851466629240248
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,12288,768,0.05928622351752388
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,12288,2560,0.2970044347974989
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,12288,512,0.04383377896414863
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,12288,1536,0.14757243792215982
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,12288,1024,0.11146844757927789
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,12288,256,0.0414373344845242
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,12288,128,0.025419554776615564
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,12288,64,0.03053511182467143
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,12288,512,0.07988533046510485
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,12288,32,0.03183111217286851
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,12288,256,0.06078755855560303
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,12288,128,0.05676711267895169
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,12288,64,0.057851552963256836
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,12288,32,0.06025511026382446
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,10240,16384,0.713598198360867
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,12288,51200,6.2263904147677955
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,12288,768,0.0960586667060852
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,10240,12288,0.7059724595811633
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,10240,16384,1.3429057863023546
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,12288,65536,7.851193745930989
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,10240,51200,2.6895874871148
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,10240,10240,0.4951270951165094
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,10240,12288,1.0216489368014865
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,10240,8192,0.44789955351087785
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,10240,65536,3.3094293806287975
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,10240,7168,0.38284889856974286
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,10240,10240,0.8367964426676432
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,10240,8192,0.6472204526265463
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,10240,6144,0.3651422129737006
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,10240,7168,0.566971566942003
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,10240,5120,0.27126754654778373
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,10240,4096,0.22356979052225748
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,10240,3584,0.19568978415595162
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,10240,5120,0.40084444151984316
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,10240,3072,0.1582391129599677
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,10240,6144,0.5128560066223145
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,10240,4096,0.35878756311204696
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,10240,2560,0.13333511352539062
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,10240,3584,0.3291084501478407
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,10240,3072,0.25581243303087026
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,10240,2560,0.2231768767038981
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,10240,1536,0.08984711435106064
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,10240,1024,0.06128178040186564
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,10240,768,0.05013422171274821
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,10240,1536,0.13408888710869685
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,10240,512,0.037031110790040754
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,10240,1024,0.10229333241780598
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,10240,256,0.026869333452648584
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,10240,128,0.021479111578729417
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,10240,768,0.08017422093285455
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,10240,512,0.06515644656287299
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,10240,64,0.019581332802772522
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,10240,32,0.020376000139448378
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,10240,256,0.05543555484877693
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,10240,128,0.04981688989533318
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,10240,64,0.05021689004368252
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,10240,32,0.05123022198677063
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,10240,51200,5.1790924072265625
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,10240,2048,0.12197155422634548
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,10240,2048,0.17225333054860434
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,8192,16384,0.7261955473158094
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,8192,12288,0.4933297899034288
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,8192,16384,1.1538480122884114
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,8192,10240,0.4227413336435954
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,8192,51200,2.0239599015977645
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,10240,65536,7.298430548773871
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,8192,8192,0.3520924515194363
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,8192,12288,0.9359049267239041
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,8192,7168,0.2889271047380236
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,8192,10240,0.7069075372483996
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,8192,6144,0.26767465803358287
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,8192,65536,2.844789293077257
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,8192,8192,0.5895902315775553
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,8192,5120,0.22340355979071724
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,8192,7168,0.5501279830932617
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,8192,4096,0.19234932793511283
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,8192,6144,0.4655893113878038
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,8192,3584,0.14736089441511366
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,8192,3072,0.14089243941836888
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,8192,5120,0.4225040011935764
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,8192,2560,0.11580799685584174
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,8192,3584,0.24824712011549208
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,8192,2048,0.0933084421687656
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,8192,3072,0.2119964493645562
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,8192,1024,0.04881155490875244
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,8192,2560,0.2061013380686442
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,8192,1536,0.11986400021447076
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,8192,768,0.0369484457704756
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,8192,512,0.028175999720891316
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,8192,1024,0.08623288737403022
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,8192,256,0.021362667282422382
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,8192,768,0.06969422101974487
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,8192,512,0.057895110713111035
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,8192,256,0.04604711135228475
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,8192,64,0.015547555353906421
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,8192,128,0.04202933443917168
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,8192,32,0.016158221496476066
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,8192,64,0.03937955697377523
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,8192,32,0.04000711109903123
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,8192,4096,0.2784453233083089
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,8192,51200,4.437736935085721
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,8192,1536,0.06872177786297269
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,8192,2048,0.15301956070794
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,8192,128,0.017729777428838942
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,7168,16384,0.5706586837768555
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,8192,65536,5.620550367567275
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,7168,12288,0.44923824734157985
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,7168,16384,1.064168930053711
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,7168,10240,0.37135910987854004
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,7168,51200,1.7739440070258246
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,7168,12288,0.8191973368326823
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,7168,8192,0.3037528991699219
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,7168,10240,0.7286462253994412
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,7168,7168,0.274162663353814
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,7168,65536,2.2837386661105685
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,7168,6144,0.23044443130493164
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,7168,8192,0.5837875472174751
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,7168,5120,0.19985244009229872
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,7168,4096,0.15537422233157688
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,7168,7168,0.4598746829562717
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,7168,3584,0.13864621851179335
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,7168,6144,0.39579910702175564
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,7168,5120,0.3770426644219293
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,7168,3072,0.12318489286634658
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,7168,3584,0.22411823272705078
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,7168,4096,0.3126586543189155
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,7168,2560,0.10123466783099705
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,7168,2048,0.08312977684868707
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,7168,1536,0.05611822340223524
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,7168,3072,0.19404089450836182
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,7168,1024,0.04241066508822971
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,7168,2560,0.17807555198669434
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,7168,768,0.034655110703574285
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,7168,2048,0.13710489537980822
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,7168,1536,0.10635377963383992
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,7168,512,0.025088888075616624
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,7168,1024,0.07940177785025702
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,7168,256,0.019814221395386588
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,7168,128,0.016182222300105624
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,7168,768,0.06915644142362806
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,7168,64,0.013719999955760108
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,7168,256,0.040885332557890154
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,7168,32,0.014111111561457316
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,7168,128,0.03601600064171685
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,7168,64,0.03632888860172696
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,7168,32,0.03495999839570787
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,7168,51200,4.066727108425565
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,7168,512,0.05272533496220907
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,6144,16384,0.4980293379889594
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,7168,65536,4.994255913628472
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,6144,51200,1.6381075117323134
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,6144,65536,1.943832821316189
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,6144,12288,0.42586755752563477
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,6144,10240,0.34189867973327637
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,6144,8192,0.25567732916937935
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,6144,16384,0.9789475335015191
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,6144,7168,0.2607564396328396
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,6144,12288,0.7506302197774252
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,6144,6144,0.19154844019148085
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,6144,10240,0.6008568869696723
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,6144,8192,0.6008257865905762
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,6144,4096,0.1358835564719306
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,6144,5120,0.1651839945051405
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,6144,7168,0.43404176500108504
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,6144,3584,0.10997600025600857
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,6144,3072,0.09532711240980361
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,6144,6144,0.3951431115468343
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,6144,5120,0.3032906585269504
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,6144,2560,0.0854053364859687
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,6144,4096,0.2503937880198161
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,6144,2048,0.07198044326570299
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,6144,3584,0.2082151174545288
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,6144,1536,0.052700443400277026
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,6144,1024,0.03556177682346768
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,6144,3072,0.17702221870422363
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,6144,768,0.026716444227430556
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,6144,2048,0.12565155824025473
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,6144,512,0.02392533255947961
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,6144,256,0.017328000730938382
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,6144,1024,0.07386933432685004
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,6144,768,0.0588408907254537
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,6144,128,0.013630222115251752
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,6144,64,0.015141333142916361
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,6144,256,0.036121779017978244
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,6144,32,0.015535111228624979
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,6144,128,0.03346577617857192
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,6144,51200,3.498773362901476
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,6144,64,0.03258311086230808
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,6144,32,0.03160533308982849
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,6144,2560,0.15431643856896296
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,6144,1536,0.09855555825763279
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,6144,65536,4.564380645751953
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,6144,512,0.04634311132960849
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,5120,12288,0.2989484469095866
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,5120,16384,0.4274017810821533
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,5120,51200,1.3270799848768446
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,5120,65536,1.6074960496690538
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,5120,10240,0.28586843278672963
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,5120,8192,0.22890843285454643
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,5120,12288,0.6573066711425781
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,5120,16384,0.8925555547078451
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,5120,7168,0.22739733590020073
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,5120,6144,0.15424088637034097
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,5120,10240,0.5738764339023167
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,5120,8192,0.4668266508314345
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,5120,4096,0.09336533149083455
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,5120,7168,0.4661911328633626
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,5120,6144,0.3338017728593614
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,5120,3584,0.09749422470728557
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,5120,5120,0.2773475646972656
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,5120,3072,0.08115644587410821
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,5120,4096,0.22246132956610787
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,5120,2560,0.07078488667805989
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,5120,2048,0.05783910883797539
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,5120,3072,0.1638924413257175
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,5120,1536,0.042232887612448804
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,5120,2560,0.13693155182732478
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,5120,1024,0.027845333019892376
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,5120,2048,0.11393688784705268
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,5120,768,0.022267555197079975
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,5120,1536,0.09070489141676162
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,5120,512,0.018093332648277283
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,5120,1024,0.0668826699256897
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,5120,256,0.013787555197874704
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,5120,768,0.053575999206966825
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,5120,128,0.012119111087587146
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,5120,512,0.041386667225095965
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,5120,64,0.01050222251150343
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,5120,256,0.0322382218307919
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,5120,51200,3.148468441433377
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,5120,128,0.029373334513770208
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,5120,5120,0.15533333354526097
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,5120,64,0.028777778148651123
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,5120,32,0.02882755464977688
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,5120,3584,0.23160711924235025
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,4096,16384,0.3470906681484646
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,5120,65536,4.297648111979167
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,4096,51200,1.129518191019694
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,4096,65536,1.2597324583265517
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,5120,32,0.010684444672531553
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,4096,12288,0.27246756023830837
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,4096,10240,0.2138000064425998
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,4096,8192,0.17933689223395455
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,4096,7168,0.1816906664106581
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,4096,10240,0.49495024151272243
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,4096,16384,0.8325075573391385
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,4096,6144,0.1281928883658515
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,4096,5120,0.10764800177680121
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,4096,12288,0.7394524680243598
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,4096,8192,0.4312346776326497
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,4096,4096,0.08266488711039226
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,4096,3584,0.07385155227449205
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,4096,6144,0.3015253278944227
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,4096,3072,0.06799999872843425
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,4096,5120,0.2528666655222575
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,4096,4096,0.2026231156455146
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,4096,3584,0.17441956202189127
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,4096,2048,0.046606222788492836
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,4096,1536,0.03608533408906724
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,4096,2560,0.1245759990480211
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,4096,1024,0.02409244411521488
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,4096,2048,0.10715911123487686
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,4096,768,0.020055111911561754
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,4096,1536,0.08304533031251696
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,4096,512,0.014775110615624322
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,4096,1024,0.05947644180721707
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,4096,256,0.011705777711338468
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,4096,768,0.04831288920508491
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,4096,51200,2.766685273912218
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,4096,512,0.03622488843070136
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,4096,128,0.010332444475756751
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,4096,64,0.009015999734401703
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,4096,256,0.028472890456517536
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,4096,32,0.008976000050703684
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,4096,64,0.025417778227064345
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,4096,128,0.026748443643252056
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,4096,32,0.025063999825053748
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,4096,7168,0.43645511733161074
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,4096,2560,0.057393776045905225
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,4096,65536,3.5725877549913196
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,4096,3072,0.14716977543301052
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,3584,16384,0.30114934179517955
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,3584,12288,0.20820889208051893
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,3584,10240,0.18807555569542778
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,3584,51200,0.9036711586846246
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,3584,65536,1.1504604551527235
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,3584,8192,0.1509502198961046
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,3584,12288,0.5604533089531792
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,3584,16384,0.7466266420152453
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,3584,7168,0.14749866061740452
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,3584,10240,0.48865154054429794
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,3584,6144,0.11012444231245254
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,3584,5120,0.10905689001083374
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,3584,4096,0.0706604454252455
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,3584,8192,0.46575556861029727
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,3584,7168,0.39292356703016496
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,3584,6144,0.2871217727661133
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,3584,5120,0.24359822273254395
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,3584,3072,0.059691554970211454
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,3584,2560,0.04978933268123203
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,3584,4096,0.22153777546352812
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,3584,2048,0.04099377658632066
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,3584,3584,0.16879733403523764
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,3584,1536,0.029736889733208552
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,3584,3072,0.1392293373743693
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,3584,2560,0.1212728950712416
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,3584,1024,0.021125333176718816
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,3584,768,0.01799199978510539
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,3584,2048,0.10098844766616821
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,3584,512,0.014504889647165934
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,3584,1536,0.07838310798009236
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,3584,256,0.01070844464831882
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,3584,1024,0.05531111028459337
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,3584,768,0.04516355527771843
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,3584,128,0.009346666435400644
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,3584,64,0.008227555288208855
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,3584,512,0.03537955549028184
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,3584,32,0.00868444475862715
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,3584,256,0.026752000053723652
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,3584,128,0.024412444896168176
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,3584,64,0.023696889479955036
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,3584,32,0.023336889015303716
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,3584,51200,2.4905982547336154
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,3584,3584,0.06362755431069268
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,3072,16384,0.2574400107065837
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,3072,51200,0.8346151245964898
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,3584,65536,3.2493413289388022
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,3072,65536,1.0559448666042752
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,3072,10240,0.18120266331566703
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,3072,16384,0.7053057882520887
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,3072,8192,0.13451911343468562
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,3072,7168,0.12983911567264134
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,3072,12288,0.6324284341600206
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,3072,10240,0.5314639939202203
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,3072,8192,0.359186675813463
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,3072,6144,0.0984319978290134
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,3072,5120,0.08436266581217448
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,3072,4096,0.06823111242718168
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,3072,7168,0.35661334461636013
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,3072,6144,0.28362488746643066
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,3072,3584,0.05527111225657993
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,3072,3072,0.04638933473163181
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,3072,12288,0.19051733281877306
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,3072,2560,0.04095822241571214
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,3072,4096,0.1801288922627767
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,3072,2048,0.03387466735310025
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,3072,3584,0.16154489252302381
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,3072,1536,0.0266951107316547
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,3072,3072,0.13227821720971003
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,3072,1024,0.01982222166326311
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,3072,2560,0.11227556069691975
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,3072,768,0.015791111522250705
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,3072,512,0.011808888779746162
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,3072,51200,2.349008984035916
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,3072,1024,0.05205333232879639
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,3072,256,0.009653333160612319
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,3072,512,0.03225955698225234
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,3072,128,0.00832177781396442
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,3072,64,0.007320000065697565
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,3072,256,0.025096888343493145
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,3072,32,0.007620444728268518
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,3072,128,0.022720000810093347
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,3072,64,0.021634666456116572
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,3072,65536,2.955521689520942
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,3072,32,0.02167911165290409
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,3072,5120,0.23063821262783477
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,2560,16384,0.21577866872151694
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,3072,2048,0.0913706686761644
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,2560,65536,0.8584426773918999
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,3072,1536,0.0718017750316196
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,3072,768,0.041456000672446355
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,2560,10240,0.14416621790991888
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,2560,8192,0.10741066932678223
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,2560,16384,0.6676266458299426
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,2560,10240,0.42303911844889325
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,2560,12288,0.5462240113152398
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,2560,7168,0.10097599691814846
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,2560,6144,0.08042399750815497
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,2560,8192,0.34317154354519314
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,2560,5120,0.06566666894488864
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,2560,4096,0.051557332277297974
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,2560,7168,0.30057154761420357
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,2560,6144,0.2578302224477132
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,2560,3584,0.048708445496029325
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,2560,51200,0.592417769961887
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,2560,3072,0.038422223594453596
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,2560,4096,0.17345689402686226
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,2560,2560,0.03257866700490316
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,2560,2048,0.02684088879161411
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,2560,3584,0.14636888768937853
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,2560,3072,0.12462488810221355
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,2560,1536,0.02258577777279748
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,2560,12288,0.16178222497304282
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,2560,51200,2.1370275285508895
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,2560,1024,0.015206222732861837
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,2560,2560,0.10594044129053752
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,2560,768,0.012841777669058906
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,2560,1536,0.0662062234348721
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,2560,1024,0.048862222168180675
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,2560,768,0.039292444785436
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,2560,256,0.00795288880666097
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,2560,512,0.030204445123672485
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,2560,128,0.007239110767841339
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,2560,64,0.0069253332912921906
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,2560,256,0.023014222582181294
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,2560,32,0.0069217777086628815
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,2560,128,0.021295999487241108
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,2560,64,0.020239111449983384
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,2560,65536,2.7668870290120444
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,2560,32,0.019959999455346
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,2048,16384,0.16445955965254042
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,2560,5120,0.21845955318874785
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,2048,65536,0.61026578479343
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,2048,12288,0.12256356080373128
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,2048,51200,0.5065911081102159
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,2048,10240,0.10370933347278172
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,2048,8192,0.0824071102672153
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,2560,2048,0.08604622549480861
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,2048,16384,0.6294790903727213
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,2048,10240,0.43081778950161403
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,2048,7168,0.07872266901863946
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,2048,6144,0.06385778056250678
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,2048,8192,0.32231465975443524
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,2048,5120,0.05481600099139743
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,2048,7168,0.2887769010331896
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,2048,6144,0.2441022131178114
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,2048,4096,0.04493066668510437
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,2048,5120,0.2047119935353597
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,2048,3584,0.03730400072203742
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,2048,3072,0.031200889084074233
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,2048,4096,0.16117421785990396
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,2048,2560,0.02847733431392246
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,2048,3072,0.1179902156194051
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,2048,51200,1.9986159006754558
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,2048,2048,0.02420711186197069
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,2048,1536,0.018394667241308425
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,2048,2560,0.09918755292892456
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,2048,1024,0.014447111222479077
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,2048,2048,0.08052088816960652
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,2048,1536,0.06200177801979912
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,2048,768,0.011009777585665384
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,2048,12288,0.48890309863620335
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,2048,512,0.009170666337013245
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,2048,256,0.006962666908899943
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,2048,1024,0.04336444536844889
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,2048,128,0.006589333216349284
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,2048,65536,2.5450835757785373
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,2048,768,0.036673777633243136
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,2048,512,0.028491556644439697
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,2048,64,0.005912000106440649
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,2048,32,0.005952000204059813
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,2048,256,0.021764443980322942
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,2048,128,0.019273777802785236
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,2048,64,0.018580444984965853
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,2048,32,0.018554665976100497
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,1536,16384,0.1245831118689643
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,1536,51200,0.39202578862508136
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,1536,65536,0.47340091069539386
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,2048,3584,0.13913688394758436
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,1536,12288,0.1072302195760939
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,2560,512,0.010346666806273991
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,1536,10240,0.0900613334443834
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,1536,8192,0.07045066356658936
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,1536,7168,0.061497781011793345
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,1536,16384,0.5897902382744683
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,1536,12288,0.46372000376383465
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,1536,8192,0.3021537727779812
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,1536,10240,0.3973715570237901
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,1536,6144,0.05080177717738681
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,1536,5120,0.044277333550983004
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,1536,4096,0.03638489047686259
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,1536,7168,0.2673715485466851
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,1536,3072,0.02666577696800232
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,1536,6144,0.23357065518697104
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,1536,5120,0.1911626656850179
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,1536,4096,0.15017333295610216
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,1536,2560,0.023065777288542852
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,1536,3584,0.1327297819985284
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,1536,1536,0.015574221809705099
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,1536,3072,0.11028266615337795
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,1536,1024,0.0118231111102634
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,1536,2560,0.09233866797553168
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,1536,2048,0.07602666483985053
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,1536,768,0.010040889183680216
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,1536,512,0.007919111185603673
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,1536,1024,0.04081955552101135
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,1536,256,0.0063822223908371395
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,1536,768,0.033955554167429604
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,1536,512,0.02647288971477085
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,1536,128,0.005561777700980504
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,1536,64,0.004937777916590373
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,1536,256,0.020021332634819877
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,1536,32,0.005564444594913059
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,1536,128,0.017849778135617573
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,1536,64,0.01718844473361969
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,1536,32,0.016554666890038382
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,1536,65536,2.3515493604871964
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,1536,3584,0.03165600034925673
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,1024,65536,0.3629048930274115
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,1024,16384,0.09704266654120551
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,1024,51200,0.28447556495666504
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,1536,2048,0.019912888606389362
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,1024,10240,0.06311644448174371
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,1536,1536,0.05953333112928602
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,1024,8192,0.04855733447604709
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,1024,12288,0.42735910415649414
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,1536,51200,1.8429431915283203
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,1024,16384,0.5687315728929307
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,1024,7168,0.042648888296551175
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,1024,10240,0.35291110144721133
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,1024,6144,0.036657777097490095
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,1024,5120,0.028872887293497723
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,1024,4096,0.024156444602542456
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,1024,8192,0.2845635679033068
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,1024,3584,0.020945777495702107
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,1024,6144,0.2167146603266398
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,1024,5120,0.18108799722459581
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,1024,3072,0.018374222848150466
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,1024,4096,0.14159822463989258
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,1024,2560,0.016048888365427654
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,1024,3584,0.12213867240481907
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,1024,2048,0.013810666898886362
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,1024,3072,0.10345333152347141
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,1024,1536,0.01129422254032559
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,1024,2560,0.08654844760894775
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,1024,1024,0.00904799997806549
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,1024,2048,0.07091022200054593
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,1024,51200,1.7169759538438585
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,1024,768,0.007605333295133378
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,1024,1536,0.05455644594298469
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,1024,512,0.006292444550328785
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,1024,256,0.0052622221410274506
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,1024,768,0.031113776895735
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,1024,512,0.024681778417693243
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,1024,65536,2.1926915910508895
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,1024,256,0.018187556001875136
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,1024,64,0.00443111111720403
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,1024,128,0.016185777054892648
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,1024,64,0.015459555718633862
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,1024,32,0.015127999915017022
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,1024,7168,0.24989867210388184
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,768,65536,0.2772604359520806
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,768,51200,0.21487289004855684
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,768,16384,0.07276533047358195
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,1024,12288,0.07415911224153307
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,768,12288,0.05350666575961643
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,768,10240,0.04684533344374763
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,1024,1024,0.037795556916130915
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,768,8192,0.03643555442492167
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,1024,128,0.004534222185611725
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,768,7168,0.031297776434156634
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,768,16384,0.5364204512702094
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,768,12288,0.40584532419840497
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,768,10240,0.3407164414723714
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,1024,32,0.004536889079544279
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,768,6144,0.02829422222243415
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,768,5120,0.023415111833148535
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,768,4096,0.01955111159218682
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,768,3584,0.017737777696715463
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,768,8192,0.27497778998480904
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,768,3072,0.015934222274356417
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,768,7168,0.24151110649108887
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,768,2560,0.013811555173661975
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,768,6144,0.20831999513838026
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,768,5120,0.17396177185906303
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,768,4096,0.13680711057451037
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,768,2048,0.011403555671374003
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,768,3584,0.1175617774327596
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,768,1536,0.009880888793203566
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,768,3072,0.09917866521411473
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,768,1024,0.007820444802443186
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,768,768,0.006962666908899943
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,768,2560,0.08280266655815972
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,768,2048,0.06799999872843425
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,768,512,0.005590222362014983
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,768,1536,0.05239822136031257
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,768,1024,0.03637689020898607
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,768,256,0.004923555586073133
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,768,128,0.004504888835880491
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,768,768,0.029866665601730347
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,768,32,0.0045422220395671
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,768,512,0.023902222514152527
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,768,256,0.017571555243598092
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,768,128,0.015398222539159985
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,768,64,0.014713777436150445
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,768,51200,1.6569564607408311
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,768,32,0.014162666267818876
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,512,16384,0.04737600021892124
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,512,65536,0.19751377900441489
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,512,51200,0.14998755190107557
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,512,12288,0.039170665873421565
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,768,65536,2.1105244954427085
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,512,8192,0.02329866588115692
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,512,10240,0.32815466986762154
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,512,16384,0.5156390931871202
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,512,7168,0.020399111840460036
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,512,8192,0.2654168870713976
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,512,6144,0.017874666386180453
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,512,5120,0.015356444650226168
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,512,7168,0.2327022287580702
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,512,6144,0.20061333974202475
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,512,5120,0.1674577792485555
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,768,64,0.004238222208287981
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,512,3584,0.011767999993430244
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,512,3072,0.010495111346244812
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,512,4096,0.13180000252193874
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,512,3584,0.11280622747209336
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,512,2560,0.009664889011118147
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,512,2048,0.008290666672918532
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,512,3072,0.09521244631873237
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,512,1536,0.00703111125363244
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,512,2560,0.07960710922876994
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,512,51200,1.5881360371907551
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,512,2048,0.06485066811243693
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,512,1024,0.005609777652555042
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,512,768,0.00526577772365676
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,512,1536,0.048751999934514366
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,512,512,0.004549333204825719
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,512,1024,0.03423555692036947
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,512,12288,0.39252977901034886
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,512,768,0.028778665595584448
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,512,256,0.0041804446114434134
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,512,128,0.0035537779331207275
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,512,512,0.0229751103454166
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,512,64,0.0035342222286595237
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,512,65536,2.0275537702772355
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,512,32,0.0038213332494099936
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,512,256,0.016807110773192514
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,512,128,0.014444443914625378
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,512,64,0.013797333670987023
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,256,65536,0.11657510863410102
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,512,32,0.013783999615245394
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,256,51200,0.09404889080259536
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,256,16384,0.037639998727374606
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,512,4096,0.013018666870064206
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,256,12288,0.025664889150195654
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,256,10240,0.020394666327370536
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,256,8192,0.015855110353893705
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,256,12288,0.37529423501756454
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,512,10240,0.03066844410366482
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,256,16384,0.49656269285413956
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,256,7168,0.014143110977278816
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,256,8192,0.2544524404737684
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,256,6144,0.012792888614866467
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,256,5120,0.011307555768224927
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,256,4096,0.009868444667922126
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,256,7168,0.2238933245340983
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,256,6144,0.1930302249060737
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,256,5120,0.1606302261352539
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,256,3584,0.008656889200210571
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,256,4096,0.12627377774980333
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,256,3072,0.008628444539176093
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,256,2560,0.007675555845101674
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,256,2048,0.00665511108107037
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,256,1536,0.005625777774386936
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,256,3584,0.10822488864262898
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,256,3072,0.09062666363186306
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,256,2560,0.07586133480072021
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,256,1024,0.004920888692140579
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,256,2048,0.06190222501754761
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,256,768,0.00453244439429707
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,256,512,0.004016889052258598
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,256,1536,0.04655199911859301
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,256,256,0.003535110917356279
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,256,128,0.0031742221779293488
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,256,1024,0.032403555181291364
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,256,768,0.02753511071205139
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,256,51200,1.5226311153835719
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,256,64,0.0033093332830402586
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,256,256,0.01586666703224182
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,256,32,0.003563555578390757
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,256,128,0.013448889056841532
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,256,64,0.013088000317414602
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,256,32,0.01277511070171992
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,128,65536,0.09930488798353408
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,128,51200,0.07987378040949504
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,128,16384,0.030745777818891738
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,256,10240,0.31557512283325195
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,128,12288,0.022325333621766832
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,256,65536,1.9454000261094835
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,128,10240,0.015287111202875773
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,128,8192,0.013578666581047906
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,128,7168,0.012418666647540199
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,128,10240,0.3080711099836561
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,128,12288,0.3674417866600885
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,128,8192,0.24932977888319227
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,128,16384,0.4866097768147786
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,128,6144,0.011019555230935415
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,128,5120,0.010031110710567897
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,128,4096,0.008640888664457533
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,128,7168,0.21905244721306694
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,128,3584,0.008273777862389883
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,128,3072,0.007302222152551015
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,128,6144,0.18915111488766143
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,128,5120,0.15738044844733343
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,128,4096,0.12344355053371853
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,128,3584,0.10564444462458293
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,128,2560,0.006776888751321369
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,128,2048,0.005906666732496685
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,128,1536,0.005247999810510212
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,128,1024,0.0042275554604000514
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,256,512,0.021963554951879714
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,128,2560,0.0745662252108256
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,128,768,0.004134222037262387
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,128,2048,0.0605928897857666
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,128,1536,0.045215109984079994
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,128,512,0.0035617777870761026
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,128,256,0.003216000066863166
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,128,1024,0.03188000122706095
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,128,128,0.0032257777121331957
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,128,64,0.003149333306484752
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,128,768,0.027104889353116352
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,128,512,0.02126577827665541
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,128,256,0.015509333875444202
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,128,32,0.0032142222755485107
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,128,128,0.013111111190583972
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,128,64,0.012395555774370829
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,64,65536,0.09615288840399848
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,128,32,0.01239377756913503
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,64,51200,0.07079111205206977
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,64,16384,0.02812622321976556
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,64,12288,0.01867022282547421
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,128,65536,1.9066338009304469
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,64,10240,0.014821334017647637
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,64,12288,0.3668702178531223
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,64,8192,0.01237066669596566
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,128,3072,0.08875644207000732
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,64,7168,0.011400000088744693
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,64,8192,0.24888179037306044
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,64,6144,0.010055999788973067
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,64,7168,0.21853244304656982
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,64,5120,0.009106666677527958
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,128,51200,1.4908808602227106
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,64,4096,0.00795377790927887
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,64,6144,0.1886071099175347
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,64,5120,0.15734577178955078
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,64,3584,0.007250666618347168
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,64,3072,0.00657155571712388
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,64,51200,1.4885475370619032
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,64,4096,0.12325689527723525
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,64,2560,0.005958222266700532
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,64,2048,0.005551110953092575
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,64,3584,0.1056106686592102
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,64,3072,0.08808710840013291
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,64,1536,0.004861333303981357
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,64,1024,0.0041866666740841335
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,64,65536,1.90465694003635
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,64,16384,0.48588355382283527
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,64,768,0.0038408889538711975
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,64,512,0.00351200004418691
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,64,1536,0.04395111070738899
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,64,1024,0.03151377704408433
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,64,10240,0.3082435660892063
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,64,768,0.026407111022207472
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,64,128,0.0031031111462248694
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,64,512,0.021197333931922913
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,64,64,0.0028168888141711554
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,64,256,0.015122666954994202
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,64,128,0.01274311128589842
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,64,64,0.012431110772821637
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,32,65536,0.09045155843098958
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,64,32,0.01204533295498954
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,32,51200,0.07159199979570177
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,32,16384,0.4860071076287164
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,64,2560,0.07407910956276788
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,32,12288,0.0165964447789722
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,64,2048,0.06037244531843397
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,64,256,0.0031964443624019623
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,32,8192,0.011357333097192975
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,64,32,0.0028328889360030494
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,32,7168,0.010394666757848527
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,32,10240,0.3078604539235433
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,32,6144,0.009382222261693742
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,32,8192,0.24871465894911024
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,32,16384,0.027040888865788777
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,32,5120,0.011393778026103973
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,32,4096,0.009630222287442949
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,32,7168,0.21887644131978354
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,32,51200,1.4907271067301433
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,32,3584,0.009872888525327047
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,32,6144,0.18849599361419678
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,32,3072,0.008811555802822113
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,32,2560,0.00795733349190818
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,32,4096,0.12316621674431695
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,32,3584,0.10697778065999348
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,32,2048,0.0052168890833854675
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,32,3072,0.08949777815077041
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,32,65536,1.9054497612847223
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,32,1536,0.004572444491916233
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,32,2560,0.0747013356950548
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,32,1024,0.0038986665507157645
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,32,768,0.0035626664757728577
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,32,512,0.0035084444615576
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,32,2048,0.06042844719356961
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,32,1536,0.04577777783075968
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,32,1024,0.03179288903872172
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,32,256,0.003162666741344664
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,32,768,0.02641955514748891
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,32,64,0.0028239999794297745
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,32,256,0.015134221977657743
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,32,128,0.012746666868527731
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,32,32,0.0028124445428450904
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,32,64,0.012080888781282636
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,32,12288,0.3668791188134088
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,32,32,0.011744000017642975
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,32,5120,0.157242668999566
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,32,10240,0.01274400038851632
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4097,32,128,0.0028044444819291434
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4097,32,512,0.02130311065249973
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,65536,12288,3.786329057481554
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,65536,16384,4.910642835828993
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,65536,12288,4.41935560438368
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,65536,16384,6.237169901529948
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,65536,10240,3.412290573120117
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,65536,16384,5.768468644883897
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,65536,10240,3.629060533311632
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,65536,12288,4.234011756049262
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,65536,8192,2.604928970336914
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,65536,10240,3.4184017181396484
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,65536,8192,2.7591760423448353
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,65536,8192,2.742979473537869
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,65536,7168,2.270453347100152
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,65536,7168,2.4205243852403426
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,65536,6144,1.939992904663086
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,65536,7168,2.38117429945204
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,65536,6144,2.0605350070529513
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,65536,5120,1.5564088821411133
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,65536,51200,15.884285820855034
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,65536,4096,1.2383626302083333
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,65536,6144,2.0878853268093533
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,65536,5120,1.7397404776679144
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,65536,4096,1.379044426812066
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,65536,5120,1.7579030990600586
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,65536,4096,1.394399113125271
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,65536,3584,1.0864551332261827
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,65536,3584,1.2117155922783744
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,65536,3072,1.0369715160793729
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,65536,3072,1.0705831315782335
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,65536,3584,1.2642301983303494
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,65536,2560,0.7632853190104166
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,65536,2560,0.870738665262858
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,65536,2048,0.5764328638712565
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,65536,1536,0.44271466467115617
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,65536,2048,0.7730542288886176
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,65536,3072,1.0202870898776584
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,65536,2048,0.7229777971903483
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,65536,1024,0.32141155666775173
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,65536,2560,0.8836097717285156
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,65536,1536,0.6031609111362034
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,65536,1024,0.44474045435587567
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,65536,768,0.2543697886996799
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,65536,1536,0.5778951115078396
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,65536,512,0.19714666737450492
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,65536,1024,0.4263484477996826
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,65536,768,0.3488604492611355
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,65536,256,0.14529689153035483
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,65536,768,0.33507111337449813
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,65536,512,0.3099093437194824
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,65536,128,0.12192000283135308
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,65536,512,0.2824764516618517
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,65536,256,0.20965333779652914
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,65536,64,0.10433689090940688
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,65536,128,0.16468355390760633
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,65536,32,0.10051555765999688
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,65536,256,0.24963288837009004
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,65536,128,0.23406577110290527
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,65536,64,0.24314665794372559
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,65536,32,0.24945333268907335
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,65536,51200,26.474404229058162
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,51200,16384,3.91975106133355
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,51200,51200,12.235122680664062
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,51200,16384,4.938645256890191
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,51200,65536,16.074749416775173
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,51200,12288,2.996277279324002
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,51200,16384,4.626333448621962
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,51200,51200,15.457655164930555
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,51200,12288,3.502139621310764
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,51200,51200,19.97254096137153
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,51200,10240,2.62319204542372
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,51200,12288,3.3928000132242837
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,51200,8192,2.1446221669514975
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,51200,10240,2.8515404595269094
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,51200,10240,2.80785772535536
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,51200,8192,2.2132576836480036
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,51200,7168,1.7929492526584203
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,51200,8192,2.2479947408040366
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,51200,6144,1.457289801703559
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,51200,7168,1.9329742855495875
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,51200,65536,20.017871432834202
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,51200,6144,1.6327146954006617
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,51200,65536,26.140184190538193
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,51200,7168,1.9981822967529297
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,51200,5120,1.1986302269829643
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,51200,5120,1.3590044445461695
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,51200,4096,0.9307307137383355
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,51200,4096,1.106296009487576
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,51200,3584,0.8509182400173612
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,51200,6144,1.680450651380751
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,51200,4096,1.1011955473158095
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,51200,3584,0.9386204613579644
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,51200,3072,0.6925093332926432
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,51200,5120,1.3457021713256836
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,51200,3584,0.9361146291097006
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,51200,3072,0.8608737521701388
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,51200,2560,0.6686728795369467
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,51200,2048,0.5226764678955078
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,51200,2560,0.6906097730000814
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,51200,3072,0.7985964351230197
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,51200,1536,0.44748444027370876
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,51200,1024,0.27058400048149955
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,51200,2048,0.5977102385626899
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,51200,2560,0.6956746843126086
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,51200,2048,0.5601866510179307
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,51200,1536,0.6326417922973633
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,51200,768,0.2797813415527344
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,51200,1024,0.4717733595106337
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,51200,1024,0.33088623152838814
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,51200,512,0.14453866746690539
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,51200,256,0.11351554923587376
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,51200,768,0.2905297809176975
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,51200,512,0.22642845577663848
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,51200,512,0.22512356440226236
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,51200,256,0.20167377259996203
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,51200,128,0.08620355526606242
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,51200,256,0.17153778341081408
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,51200,64,0.07617777585983276
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,51200,32,0.0786879989835951
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,51200,768,0.20823821756574842
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,51200,64,0.19004800584581164
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,51200,1536,0.43596000141567653
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,51200,32,0.19251910845438638
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,51200,128,0.18974844614664713
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,51200,128,0.1352728870179918
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,16384,16384,1.3585084279378254
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,16384,51200,3.7607947455512156
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,16384,16384,1.8889715406629775
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,16384,65536,4.8513743082682295
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,16384,12288,0.9070729149712456
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,16384,16384,1.9090133243136937
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,16384,12288,1.3721831639607747
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,16384,12288,1.3751822577582464
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,16384,10240,0.9126817915174695
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,16384,10240,1.1182062360975478
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,16384,8192,0.707039091322157
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,16384,51200,7.6243336995442705
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,16384,51200,6.131130642361111
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,16384,10240,1.1303626166449654
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,16384,7168,0.5895137786865234
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,16384,8192,0.880059560139974
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,16384,7168,0.8067706425984701
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,16384,6144,0.5675342347886827
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,16384,65536,9.7017822265625
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,16384,6144,0.6552631060282389
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,16384,65536,7.86617448594835
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,16384,7168,0.8290524482727051
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,16384,5120,0.4357031186421712
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,16384,4096,0.3061617745293511
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,16384,6144,0.6854684617784289
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,16384,5120,0.5758408970303005
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,16384,5120,0.5686844189961752
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,16384,4096,0.4459724426269531
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,16384,3584,0.2725875642564562
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,16384,4096,0.48575380113389754
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,16384,8192,0.9085369110107422
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,16384,3072,0.24402311113145617
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,16384,3584,0.37813509835137266
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,16384,3584,0.4101591110229492
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,16384,3072,0.3270675606197781
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,16384,2048,0.15948622756534153
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,16384,3072,0.3808151086171468
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,16384,2560,0.27322755919562447
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,16384,1536,0.13309066825442845
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,16384,2560,0.3098391162024604
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,16384,2048,0.22623909844292533
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,16384,2048,0.24601954883999297
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,16384,1024,0.09758222103118896
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,16384,1536,0.17959288756052652
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,16384,768,0.06609066989686754
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,16384,1536,0.19537333647410074
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,16384,1024,0.1397742165459527
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,16384,512,0.0539173318280114
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,16384,1024,0.14940888351864284
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,16384,768,0.1126142210430569
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,16384,256,0.037321776151657104
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,16384,128,0.03086400032043457
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,16384,512,0.08723022540410359
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,16384,512,0.10070577594969009
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,16384,256,0.08177155256271362
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,16384,256,0.0748151143391927
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,16384,128,0.0695813364452786
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,16384,128,0.06016177601284451
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,16384,32,0.02609511050913069
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,16384,64,0.07113155391481188
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,16384,32,0.07191999753316243
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,16384,2560,0.2057102256351047
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,16384,768,0.12532622284359402
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,16384,64,0.026410667432679072
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,12288,16384,1.0861102210150826
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,12288,51200,3.250865724351671
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,12288,65536,3.8651945326063366
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,12288,16384,1.541253301832411
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,12288,12288,0.7945733070373535
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,12288,12288,1.0960942374335396
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,12288,16384,1.562409824795193
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,12288,10240,0.6058435440063477
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,12288,51200,5.888281928168403
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,12288,12288,1.1539395650227864
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,12288,10240,0.9474826388888888
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,12288,8192,0.5067955652872721
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,12288,51200,4.933394538031684
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,12288,8192,0.7266364627414279
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,12288,10240,0.9591395060221354
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,12288,7168,0.5243911213344997
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,12288,65536,7.608842637803819
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,12288,8192,0.7579333517286512
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,12288,6144,0.36975378460354275
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,12288,65536,6.503866831461589
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,12288,7168,0.6491449144151475
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,12288,5120,0.3108862241109212
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,12288,6144,0.6387733353508843
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,12288,4096,0.23535911242167154
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,12288,5120,0.5221706496344672
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,12288,6144,0.5910577774047852
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,12288,3584,0.2052346732881334
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,12288,5120,0.48912710613674587
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,12288,4096,0.3651439878675673
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,12288,3584,0.3077555497487386
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,12288,3072,0.18375199370914033
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,12288,4096,0.4517146746317546
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,12288,2560,0.14798488881852892
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,12288,3584,0.3505280017852783
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,12288,2048,0.1271022160847982
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,12288,2560,0.22811023394266763
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,12288,3072,0.2977831098768446
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,12288,7168,0.6657457881503636
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,12288,1536,0.10642400052812363
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,12288,2560,0.2742604414621989
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,12288,1024,0.06790933344099256
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,12288,2048,0.18649066819085014
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,12288,2048,0.2139822244644165
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,12288,1536,0.16744532850053576
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,12288,1536,0.14485155211554632
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,12288,1024,0.12645333343082005
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,12288,1024,0.11071822378370498
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,12288,512,0.03972266780005561
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,12288,768,0.1054426696565416
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,12288,768,0.087208886941274
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,12288,256,0.028685334655973647
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,12288,512,0.07278311252593994
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,12288,128,0.024179556303554114
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,12288,256,0.06462133593029447
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,12288,256,0.060214221477508545
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,12288,64,0.020972443951500788
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,12288,3072,0.2638355626000298
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,12288,128,0.051111999485227794
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,12288,128,0.05608355336719089
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,12288,64,0.05619821945826212
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,12288,32,0.0578977796766493
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,12288,768,0.052417778306537204
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,12288,512,0.0839831100569831
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,12288,32,0.02139733400609758
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,65536,51200,22.651482476128475
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,10240,16384,0.8852337731255425
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,10240,51200,2.5777155558268228
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,10240,65536,3.298635482788086
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,10240,16384,1.3379920323689778
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,10240,12288,0.6792053116692437
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,10240,16384,1.4168693754408095
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,10240,12288,0.9785359700520834
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,10240,12288,1.04057863023546
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,10240,10240,0.816921763949924
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,10240,8192,0.387027555041843
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,10240,10240,0.5230515797932943
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,10240,10240,0.8637262450324165
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,10240,51200,5.07748285929362
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,10240,7168,0.32009779082404244
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,10240,6144,0.26910310321384007
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,10240,8192,0.717284467485216
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,10240,7168,0.5645653406778971
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,10240,65536,6.523706648084853
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,10240,51200,4.5160238477918835
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,10240,5120,0.26304533746507436
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,10240,7168,0.6328239970737034
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,10240,6144,0.4873493512471517
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,10240,4096,0.22160532739427355
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,10240,6144,0.5322453180948893
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,10240,3584,0.19859822591145834
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,10240,4096,0.31791289647420246
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,10240,5120,0.4337422317928738
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,10240,4096,0.36118398772345645
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,10240,5120,0.45671553081936306
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,10240,65536,5.835984971788194
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,10240,3072,0.1486133337020874
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,10240,3584,0.27311733033921987
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,10240,2560,0.1311146683163113
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,10240,3072,0.23883289761013457
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,10240,3072,0.27402933438618976
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,10240,3584,0.4154977798461914
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,10240,2560,0.2607662147945828
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,10240,2560,0.21588177151150176
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,10240,2048,0.17715822325812447
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,10240,1536,0.08176266484790377
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,10240,1024,0.056361774603525795
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,10240,2048,0.19384800063239205
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,10240,768,0.04451910985840691
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,10240,1536,0.1580853329764472
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,10240,1536,0.14118399884965685
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,10240,1024,0.1163511143790351
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,10240,1024,0.10047822528415257
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,10240,512,0.034719109535217285
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,10240,256,0.025265778104464214
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,10240,768,0.10012088881598578
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,10240,768,0.07773866918351915
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,10240,128,0.023331556055280898
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,10240,512,0.0772248903910319
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,10240,256,0.05418755610783895
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,10240,256,0.06148266792297363
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,10240,64,0.019298666053348117
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,10240,128,0.049235555860731334
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,10240,32,0.020047111643685233
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,10240,128,0.04836977852715386
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,10240,8192,0.6398737695482042
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,10240,64,0.050322665108574756
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,10240,32,0.05016711023118761
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,10240,2048,0.10427111387252808
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,10240,512,0.06485511196984185
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,8192,16384,0.6920773188273112
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,8192,51200,2.097656038072374
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,8192,65536,2.634181340535482
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,8192,12288,0.48526668548583984
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,8192,16384,1.169083595275879
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,8192,12288,0.850546677907308
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,8192,10240,0.387351115544637
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,8192,16384,1.262569745381673
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,8192,8192,0.3392186694675022
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,8192,12288,0.939300431145562
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,8192,10240,0.6983866691589355
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,8192,51200,4.211090511745877
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,8192,7168,0.29837332831488717
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,8192,10240,0.8178266419304742
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,8192,8192,0.606927129957411
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,8192,6144,0.23903022872077095
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,8192,8192,0.6279937956068251
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,8192,7168,0.5048773553636339
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,8192,51200,3.987396240234375
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,8192,5120,0.1989368862575955
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,8192,6144,0.42526666323343915
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,8192,4096,0.1577226718266805
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,8192,5120,0.35151200824313694
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,8192,6144,0.4889555507236057
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,8192,3584,0.13400977187686497
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,8192,4096,0.27610932456122506
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,8192,5120,0.4170657793680827
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,8192,4096,0.3602622350056966
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,8192,3072,0.11730044417911106
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,8192,3584,0.24019021458095977
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,8192,65536,5.077312893337674
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,8192,2560,0.0983404450946384
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,8192,3584,0.2865271038479275
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,8192,3072,0.20825510554843477
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,8192,2048,0.0897031095292833
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,8192,3072,0.25728623072306317
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,8192,2560,0.17463110552893746
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,8192,1536,0.061928888161977134
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,8192,1024,0.04338399900330437
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,8192,2048,0.14380533165401882
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,8192,2560,0.21766311592525908
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,8192,2048,0.17412800259060332
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,8192,768,0.03501244386037191
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,8192,1536,0.13840177324083117
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,8192,1024,0.10464088784323798
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,8192,1024,0.09073333607779609
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,8192,512,0.02755822241306305
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,8192,768,0.06801955567465888
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,8192,768,0.08790755271911621
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,8192,512,0.07225244575076632
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,8192,512,0.05575022432539198
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,8192,256,0.053912887970606484
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,8192,256,0.04526577724350823
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,8192,64,0.014479110638300577
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,8192,128,0.04213688770929972
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,8192,128,0.0413973331451416
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,8192,32,0.014863111906581454
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,8192,64,0.04044355617629157
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,8192,32,0.03935022155443827
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,8192,1536,0.11446932951609294
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,8192,65536,5.471310085720486
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,8192,256,0.01924622224436866
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,8192,128,0.01664888858795166
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,7168,16384,0.6657662391662598
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,8192,7168,0.5843608644273546
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,7168,65536,2.45778316921658
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,7168,51200,2.1204649607340493
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,7168,12288,0.4851377805074056
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,7168,16384,1.0892435709635417
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,7168,10240,0.3427591058943007
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,7168,16384,1.2102977964613173
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,7168,12288,0.8099635442097982
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,7168,8192,0.27098221249050564
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,7168,12288,0.9102533128526477
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,7168,10240,0.6868577533298068
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,7168,7168,0.23824887805514863
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,7168,10240,0.7513262430826823
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,7168,8192,0.5329448911878798
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,7168,51200,3.8777067396375866
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,7168,6144,0.1930302249060737
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,7168,8192,0.6047502093844944
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,7168,7168,0.46167733934190536
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,7168,5120,0.17302578025394014
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,7168,65536,5.07329347398546
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,7168,7168,0.5331510967678493
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,7168,6144,0.39888978004455566
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,7168,4096,0.1320693360434638
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,7168,5120,0.32690665456983775
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,7168,6144,0.46153868569268125
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,7168,3584,0.11637066470252143
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,7168,4096,0.2554559972551134
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,7168,5120,0.3909768793318007
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,7168,3072,0.09578933318456014
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,7168,65536,4.805885314941406
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,7168,3584,0.2225280072953966
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,7168,3584,0.2724826600816515
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,7168,2560,0.08362044228447808
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,7168,3072,0.19095555941263834
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,7168,3072,0.24042399724324545
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,7168,2048,0.07151910993787977
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,7168,2560,0.16281955771976048
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,7168,2560,0.20002488295237222
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,7168,1536,0.05859022008048164
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,7168,1024,0.038775109582477145
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,7168,2048,0.1332168844011095
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,7168,2048,0.16809866163465711
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,7168,768,0.030277334981494482
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,7168,1536,0.10577599869834052
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,7168,1536,0.13283822271558973
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,7168,51200,3.7869750128852
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,7168,512,0.02731288969516754
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,7168,1024,0.10024088621139526
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,7168,256,0.021525333325068157
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,7168,768,0.0843377775616116
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,7168,768,0.06348355611165364
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,7168,512,0.06684355603324042
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,7168,128,0.01647822227742937
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,7168,512,0.051134222083621554
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,7168,64,0.014081777797804939
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,7168,256,0.04053689042727152
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,7168,256,0.05083910955323113
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,7168,32,0.014697778556081982
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,7168,128,0.03607022100024753
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,7168,64,0.03517955541610718
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,7168,32,0.03500977820820279
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,7168,4096,0.31334400177001953
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,7168,1024,0.07914044459660848
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,7168,128,0.03884444302982754
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,6144,16384,0.47539377212524414
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,6144,51200,1.5486159854465062
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,6144,65536,1.929634730021159
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,6144,12288,0.372670226626926
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,6144,16384,0.9748533036973742
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,6144,10240,0.3263324366675483
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,6144,12288,0.7346791161431206
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,6144,16384,1.1230559878879123
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,6144,8192,0.27909599410163033
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,6144,12288,0.851968871222602
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,6144,10240,0.6283946567111546
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,6144,10240,0.7038995424906412
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,6144,7168,0.22204000420040557
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,6144,51200,3.481480916341146
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,6144,8192,0.5191013548109267
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,6144,8192,0.5712089008755153
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,6144,6144,0.1991431050830417
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,6144,7168,0.42066311836242676
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,6144,6144,0.364774227142334
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,6144,7168,0.5079004499647353
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,6144,6144,0.43669690026177305
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,6144,4096,0.1322853300306532
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,6144,65536,4.530926174587674
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,6144,5120,0.30169065793355304
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,6144,5120,0.3708453443315294
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,6144,3584,0.11286044120788574
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,6144,4096,0.23630756802029082
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,6144,3072,0.09613333145777385
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,6144,51200,3.4960265689425998
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,6144,3584,0.2049928903579712
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,6144,4096,0.29146843486362034
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,6144,2560,0.08365422487258911
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,6144,3584,0.25695644484625924
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,6144,2048,0.0629262195693122
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,6144,3072,0.17535911666022408
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,6144,3072,0.22898133595784506
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,6144,2560,0.14978488286336264
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,6144,2560,0.18842577934265137
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,6144,1536,0.04958488874965244
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,6144,1024,0.03610488772392273
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,6144,2048,0.1232373317082723
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,6144,65536,4.514110989040799
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,6144,2048,0.15705245070987278
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,6144,5120,0.16860089037153456
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,6144,768,0.02908266584078471
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,6144,1536,0.12496977382236057
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,6144,1536,0.09872533215416802
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,6144,1024,0.07302400138643053
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,6144,1024,0.09399466382132636
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,6144,256,0.01646577815214793
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,6144,768,0.07891733116573758
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,6144,768,0.0587715572781033
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,6144,512,0.04601600103908115
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,6144,512,0.06304977999793158
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,6144,256,0.035530666510264076
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,6144,256,0.047817776600519814
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,6144,32,0.012888888518015543
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,6144,128,0.03825777769088745
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,6144,64,0.031960888041390315
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,6144,32,0.03167555398411221
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,6144,512,0.022073777185546026
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,6144,128,0.013901333014170328
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,6144,64,0.01238844460911221
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,6144,128,0.03263288736343384
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,5120,51200,1.3276151021321614
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,5120,65536,1.6388311386108398
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,5120,16384,0.44254133436414933
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,5120,12288,0.3414915667639838
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,5120,16384,1.0335288577609592
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,5120,16384,1.060524410671658
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,5120,12288,0.7975235515170627
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,5120,10240,0.29251734415690106
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,5120,12288,0.8098488913642036
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,5120,10240,0.5493520100911459
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,5120,8192,0.22961778110928008
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,5120,65536,3.9956016540527344
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,5120,51200,3.075046327379015
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,5120,10240,0.6876639790005155
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,5120,8192,0.4382950994703505
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,5120,6144,0.1736373371548123
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,5120,8192,0.5458195474412706
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,5120,7168,0.389831993314955
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,5120,5120,0.13481067286597356
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,5120,6144,0.3314106729295519
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,5120,7168,0.4746818012661404
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,5120,51200,3.2427999708387585
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,5120,4096,0.10440444284015232
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,5120,65536,4.143053266737196
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,5120,6144,0.4202586544884576
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,5120,3584,0.08965777688556248
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,5120,5120,0.2770124541388618
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,5120,3072,0.07724622223112318
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,5120,5120,0.35140087869432235
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,5120,4096,0.21738221910264757
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,5120,3584,0.18804089228312174
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,5120,2560,0.06770755847295125
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,5120,4096,0.27312710550096303
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,5120,3584,0.2422800064086914
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,5120,3072,0.16006222036149767
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,5120,2048,0.052523556682798594
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,5120,7168,0.1898053354687161
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,5120,1536,0.04566488994492424
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,5120,3072,0.20715022087097168
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,5120,1024,0.030750221676296655
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,5120,2560,0.13527199957105848
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,5120,2560,0.17555199729071724
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,5120,2048,0.14804532792833117
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,5120,768,0.02325422234005398
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,5120,1536,0.09115822447670831
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,5120,1536,0.11696355872684056
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,5120,1024,0.06611822048823039
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,5120,1024,0.08823111322191025
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,5120,256,0.013775111072593264
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,5120,768,0.07478044430414836
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,5120,768,0.052483555343416005
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,5120,512,0.05942400296529134
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,5120,512,0.042021334171295166
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,5120,256,0.043776889642079674
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,5120,64,0.010801778071456485
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,5120,32,0.011982222398122152
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,5120,128,0.035122666094038225
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,5120,128,0.028938667641745672
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,5120,64,0.028777778148651123
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,5120,32,0.028099556763966877
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,5120,2048,0.11310133669111465
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,5120,512,0.01794399983353085
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,5120,128,0.012039110892348819
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,5120,256,0.03258400162061056
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,4096,51200,0.9684257507324219
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,4096,65536,1.3089528613620334
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,4096,16384,0.34680888387891984
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,4096,12288,0.2801920043097602
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,4096,16384,0.8032968839009603
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,4096,12288,0.6552177535163032
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,4096,10240,0.2229857709672716
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,4096,16384,0.9813867145114474
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,4096,12288,0.7633991241455078
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,4096,8192,0.19856354925367567
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,4096,10240,0.5013048913743761
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,4096,7168,0.15650222036573622
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,4096,10240,0.6237911118401421
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,4096,8192,0.40043022897508407
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,4096,6144,0.1279875569873386
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,4096,8192,0.49663909276326496
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,4096,7168,0.35611645380655926
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,4096,5120,0.10507822036743164
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,4096,7168,0.440519995159573
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,4096,51200,2.7399270799424915
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,4096,6144,0.3009866608513726
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,4096,6144,0.37873244285583496
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,4096,4096,0.08150488800472684
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,4096,3584,0.07180800040562947
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,4096,5120,0.25389689869350857
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,4096,4096,0.19730756017896864
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,4096,5120,0.3187866740756565
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,4096,3072,0.05953688753975762
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,4096,4096,0.25347643428378636
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,4096,3584,0.17118488417731392
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,4096,2560,0.053230222728517324
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,4096,3584,0.22289776802062988
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,4096,3072,0.1450764470630222
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,4096,51200,2.994824939303928
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,4096,2048,0.045924444993337
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,4096,3072,0.1921937730577257
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,4096,1536,0.03404711021317376
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,4096,2560,0.122707552380032
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,4096,2560,0.16309689150916204
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,4096,1024,0.025060445070266724
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,4096,2048,0.10054400232103135
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,4096,2048,0.13577866554260254
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,4096,768,0.020261334048377145
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,4096,1536,0.08098222149742974
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,4096,1536,0.10820977555380927
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,4096,512,0.014797333214018079
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,4096,1024,0.05905244747797648
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,4096,1024,0.08136444621615939
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,4096,65536,3.462110307481554
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,4096,256,0.011969777444998423
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,4096,768,0.06892266538408068
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,4096,512,0.0539955563015408
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,4096,128,0.010732444624106089
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,4096,256,0.0410515566666921
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,4096,256,0.028216888507207234
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,4096,64,0.00979288915793101
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,4096,32,0.010045333041085137
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,4096,128,0.0329422222243415
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,4096,128,0.025528889563348558
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,4096,64,0.02530844509601593
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,4096,32,0.025068443682458665
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,4096,65536,3.8307456970214844
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,4096,768,0.04725689027044508
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,4096,512,0.03632622294955783
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,3584,51200,0.8955813513861762
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,3584,65536,1.2185128529866536
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,3584,16384,0.3143804338243273
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,3584,12288,0.23221956359015572
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,3584,16384,0.7649466726515027
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,3584,10240,0.20533866352505156
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,3584,12288,0.5893777741326226
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,3584,16384,0.9796844058566623
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,3584,12288,0.7282017601860894
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,3584,8192,0.15942045052846274
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,3584,10240,0.47044801712036133
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,3584,7168,0.1307564444012112
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,3584,8192,0.379497766494751
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,3584,10240,0.6129253175523546
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,3584,51200,2.502272923787435
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,3584,6144,0.11807821856604682
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,3584,8192,0.5179520183139378
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,3584,65536,3.3045137193467884
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,3584,7168,0.3323226769765218
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,3584,5120,0.09354666868845622
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,3584,4096,0.07236444287829928
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,3584,6144,0.2860026624467638
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,3584,7168,0.43454933166503906
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,3584,5120,0.24445509910583496
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,3584,6144,0.3760337829589844
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,3584,3584,0.07045511404673259
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,3584,5120,0.31627199384901256
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,3584,4096,0.1900728940963745
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,3584,3072,0.0605600012673272
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,3584,4096,0.25179733170403373
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,3584,2560,0.046448889705869884
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,3584,3584,0.16390044159359402
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,3584,3584,0.21998311413658989
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,3584,3072,0.13885600037044948
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,3584,3072,0.19172710842556426
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,3584,2560,0.1172951062520345
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,3584,2560,0.16185600227779812
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,3584,1536,0.029655112160576716
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,3584,1024,0.020984888076782227
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,3584,51200,2.973584916856554
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,3584,2048,0.13383021619584826
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,3584,65536,3.797980414496528
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,3584,768,0.01768977774514092
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,3584,1536,0.07694933149549696
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,3584,1536,0.10750222206115723
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,3584,512,0.0140346669488483
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,3584,1024,0.05528533458709717
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,3584,1024,0.08078666528065999
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,3584,256,0.010570666856235929
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,3584,768,0.0681697792477078
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,3584,768,0.044590221510993115
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,3584,128,0.009163555171754625
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,3584,512,0.052617778380711876
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,3584,64,0.008636444807052612
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,3584,256,0.03971288932694329
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,3584,256,0.026455110973782007
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,3584,128,0.03183199961980184
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,3584,128,0.02404266595840454
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,3584,32,0.009708444277445475
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,3584,64,0.023317333724763658
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,3584,32,0.023370666636361018
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,3584,2048,0.03984533415900336
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,3584,2048,0.09575111336178249
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,3072,51200,0.7304906845092773
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,3072,65536,0.9943759706285266
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,3584,512,0.034259554412629865
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,3072,16384,0.2611306773291694
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,3072,12288,0.19587288962470162
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,3072,16384,0.7239182260301379
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,3072,12288,0.5456657939487034
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,3072,10240,0.17160977257622612
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,3072,16384,0.938852416144477
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,3072,12288,0.7005182372199165
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,3072,10240,0.448595576816135
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,3072,8192,0.14049332671695286
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,3072,51200,2.3160088857014975
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,3072,8192,0.35924800237019855
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,3072,7168,0.1196826696395874
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,3072,10240,0.5860133171081543
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,3072,8192,0.48992178175184464
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,3072,6144,0.1080720027287801
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,3072,65536,2.9672044118245444
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,3072,7168,0.3160293367173937
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,3072,5120,0.08231733242670695
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,3072,7168,0.42654577891031903
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,3072,6144,0.2760639985402425
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,3072,4096,0.0652186671892802
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,3072,6144,0.36135289404127335
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,3072,5120,0.22655555937025282
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,3072,3584,0.05933155616124471
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,3072,5120,0.3047768804762098
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,3072,4096,0.17841955025990805
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,3072,3072,0.0499288903342353
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,3072,4096,0.24647198783026802
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,3072,51200,2.8500008053249783
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,3072,3584,0.15421333577897814
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,3072,2560,0.04144000013669332
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,3072,3584,0.21193956004248726
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,3072,2048,0.03322844372855292
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,3072,3072,0.13178577688005236
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,3072,1536,0.027664000789324444
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,3072,65536,3.6363326178656687
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,3072,2560,0.1553573343488905
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,3072,2048,0.09030044741100735
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,3072,1024,0.019288000133302476
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,3072,2048,0.12995821899837917
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,3072,768,0.01555999947918786
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,3072,1536,0.06948000192642212
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,3072,1536,0.10310666428671943
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,3072,1024,0.07783910963270399
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,3072,1024,0.051354666550954185
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,3072,256,0.010665777656767102
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,3072,768,0.04176000091764662
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,3072,768,0.06422844198015001
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,3072,128,0.009215999808576372
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,3072,512,0.051649779081344604
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,3072,256,0.02517066730393304
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,3072,64,0.009700444837411245
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,3072,128,0.02269422180122799
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,3072,32,0.008617777791288164
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,3072,64,0.021651556094487507
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,3072,32,0.021692444880803425
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,3072,3072,0.1824657784567939
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,3072,2560,0.1106026636229621
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,3072,512,0.012481778032249875
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,3072,512,0.032285332679748535
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,3072,256,0.03849777910444472
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,3072,128,0.030583110120561387
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,2560,51200,0.6280835469563802
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,2560,16384,0.22214755747053358
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,2560,12288,0.17350133260091147
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,2560,16384,0.664206239912245
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,2560,12288,0.5177475611368815
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,2560,65536,0.8460728857252332
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,2560,16384,0.9072880215115018
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,2560,10240,0.13157422012752956
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,2560,8192,0.10913244220945571
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,2560,12288,0.6708639992607964
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,2560,10240,0.4224088986714681
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,2560,8192,0.3447599940829807
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,2560,7168,0.09801955355538262
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,2560,51200,2.155125300089518
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,2560,65536,2.7494445376925998
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,2560,6144,0.08390488889482285
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,2560,8192,0.45560264587402344
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,2560,7168,0.3010844389597575
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,2560,5120,0.07117155525419447
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,2560,6144,0.2574675612979465
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,2560,7168,0.40138488345676
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,2560,4096,0.047566221819983594
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,2560,6144,0.35126754972669816
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,2560,5120,0.21544622050391304
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,2560,3584,0.048919111490249634
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,2560,4096,0.16971555021074083
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,2560,5120,0.2927813265058729
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,2560,4096,0.23190487755669487
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,2560,3584,0.14654933081732854
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,2560,3584,0.20451645056406656
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,2560,2560,0.03091199861632453
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,2560,3072,0.1244657834370931
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,2560,3072,0.17554133468204072
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,2560,2560,0.10504266950819229
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,2560,10240,0.5648870997958714
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,2560,65536,3.4860354529486766
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,2560,1536,0.022094221578703985
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,2560,2048,0.08578488561842178
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,2560,1024,0.01588444411754608
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,2560,2048,0.1240337822172377
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,2560,1536,0.0988924437099033
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,2560,1536,0.06506222486495972
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,2560,1024,0.04841599861780802
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,2560,1024,0.07454133033752441
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,2560,768,0.03860888878504435
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,2560,512,0.010285333626800114
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,2560,512,0.03019555409749349
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,2560,3072,0.03864355550871955
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,2560,256,0.00794044468137953
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,2560,512,0.04812711146142748
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,2560,256,0.023278221487998962
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,2560,2048,0.02586488922437032
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,2560,128,0.006956444846259222
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,2560,256,0.037119110425313316
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,2560,64,0.006592000110281839
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,2560,2560,0.14899110794067383
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,2560,128,0.02985244327121311
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,2560,128,0.020804444948832195
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,2560,32,0.006762666834725275
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,2560,64,0.020027556353145175
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,2560,32,0.019928000039524503
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,2560,768,0.01277955538696713
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,2560,768,0.06151466899447971
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,2048,65536,0.5967769092983669
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,2048,51200,0.5043022367689345
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,2048,16384,0.1767431100209554
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,2560,51200,2.7265120612250437
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,2048,12288,0.1300391091240777
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,2048,16384,0.6577813360426161
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,2048,12288,0.4718453089396159
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,2048,10240,0.10872888565063477
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,2048,16384,0.8658400111728244
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,2048,8192,0.08223644230100843
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,2048,12288,0.6494897736443414
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,2048,51200,1.9820550282796223
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,2048,10240,0.395414219962226
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,2048,7168,0.08296177784601848
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,2048,8192,0.3190266556209988
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,2048,10240,0.540196418762207
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,2048,65536,2.520318137274848
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,2048,6144,0.06417777803209093
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,2048,5120,0.05359377794795566
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,2048,7168,0.28115823533799916
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,2048,8192,0.4368080033196344
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,2048,6144,0.24182489183213976
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,2048,4096,0.045351111226611666
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,2048,7168,0.38512089517381454
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,2048,5120,0.20178043842315674
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,2048,6144,0.33394845326741535
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,2048,3584,0.03870933254559835
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,2048,5120,0.28068089485168457
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,2048,4096,0.15831377771165636
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,2048,4096,0.22214667002360025
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,2048,2560,0.029990222718980577
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,2048,3584,0.13699555397033691
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,2048,3584,0.19479821787940133
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,2048,51200,2.6058612399631076
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,2048,3072,0.11641244093577068
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,2048,2048,0.024829333027203877
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,2048,3072,0.16786932945251465
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,2048,1536,0.01871555546919505
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,2048,2560,0.09778666496276855
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,2048,2560,0.1430613332324558
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,2048,2048,0.08064888583289252
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,2048,1024,0.014475555883513557
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,2048,1536,0.06071644359164768
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,2048,768,0.011740444435013665
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,2048,65536,3.3202781677246094
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,2048,1024,0.043460445271597974
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,2048,512,0.009770666559537252
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,2048,1024,0.06922399997711182
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,2048,768,0.058851553334130176
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,2048,768,0.03571022219128079
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,2048,256,0.007831110722488826
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,2048,128,0.006969778074158563
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,2048,512,0.04612177941534254
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,2048,512,0.0281057788266076
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,2048,256,0.03533422284656101
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,2048,256,0.021640888518757288
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,2048,32,0.006677333265542984
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,2048,128,0.028879112667507593
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,2048,128,0.019223110543357003
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,2048,64,0.018529777725537617
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,2048,32,0.01846844454606374
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,2048,3072,0.03413777881198459
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,1536,65536,0.5239484575059679
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,1536,51200,0.3985324435763889
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,2048,2048,0.11911022663116455
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,2048,1536,0.09486666652891372
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,1536,16384,0.14057066705491808
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,1536,12288,0.1072346634334988
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,2048,64,0.006589333216349284
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,1536,16384,0.5892017682393392
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,1536,12288,0.468980418311225
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,1536,10240,0.08744444449742635
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,1536,16384,0.812004460228814
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,1536,8192,0.07757066355811225
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,1536,12288,0.6151626904805502
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,1536,10240,0.3788168960147434
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,1536,7168,0.06513422065311007
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,1536,51200,1.8394169277615016
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,1536,10240,0.5160329076978896
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,1536,8192,0.302495108710395
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,1536,6144,0.05669333537419637
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,1536,8192,0.4172622097863092
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,1536,7168,0.26607023345099556
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,1536,5120,0.04431910978423225
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,1536,6144,0.22899021042717826
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,1536,7168,0.3681013319227431
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,1536,4096,0.03478755553563436
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,1536,6144,0.3184435632493761
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,1536,5120,0.19139111042022705
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,1536,3584,0.03012977706061469
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,1536,5120,0.2683928807576497
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,1536,4096,0.15046044190724692
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,1536,3072,0.02767733401722378
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,1536,4096,0.21206133895450166
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,1536,3584,0.13011911180284289
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,1536,3584,0.1851875517103407
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,1536,2560,0.023174222972657945
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,1536,3072,0.1098782221476237
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,1536,51200,2.483197318183051
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,1536,2048,0.019834667444229126
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,1536,3072,0.15969867176479763
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,1536,65536,3.1703635321723094
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,1536,1536,0.014461333552996317
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,1536,2560,0.09235999981562297
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,1536,2560,0.1363448831770155
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,1536,1024,0.011365333365069495
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,1536,2048,0.07591378026538424
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,1536,2048,0.11343467235565186
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,1536,768,0.009689778089523315
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,1536,65536,2.35316891140408
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,1536,1536,0.09060444434483846
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,1536,1536,0.059228446748521596
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,1536,1024,0.040192888842688665
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,1536,1024,0.06601778003904554
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,1536,512,0.00795999997191959
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,1536,256,0.006962666908899943
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,1536,768,0.033259554041756526
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,1536,128,0.005936000082227919
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,1536,768,0.05578222539689806
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,1536,64,0.005548444473081165
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,1536,512,0.02640266716480255
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,1536,512,0.044065776798460216
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,1536,256,0.019914666811625164
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,1536,128,0.017515555024147034
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,1536,128,0.02752444479200575
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,1536,64,0.016876444220542908
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,1536,32,0.01683911184469859
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,1024,65536,0.3398275640275743
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,1024,51200,0.28773244222005206
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,1024,16384,0.09449422359466553
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,1024,16384,0.5699866612752279
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,1024,12288,0.07058133019341363
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,1536,256,0.034621334738201566
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,1024,16384,0.7868062125311958
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,1024,10240,0.059896886348724365
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,1024,12288,0.41750489340888125
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,1024,10240,0.3498364554511176
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,1024,12288,0.5871946546766493
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,1024,8192,0.0484862228234609
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,1024,65536,2.165668487548828
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,1024,10240,0.49231735865275067
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,1024,8192,0.28188443183898926
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,1024,7168,0.040778666734695435
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,1024,6144,0.034854223330815635
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,1024,8192,0.398235559463501
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,1536,32,0.005591111050711737
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,1024,7168,0.2482008934020996
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,1024,5120,0.02943377693494161
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,1024,51200,2.36411370171441
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,1024,4096,0.024413333998786077
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,1024,6144,0.21351467238532174
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,1024,7168,0.3517671161227756
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,1024,3584,0.022436444958051045
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,1024,6144,0.3039795557657878
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,1024,5120,0.1784720023473104
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,1024,5120,0.25598756472269696
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,1024,4096,0.14029422071244982
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,1024,4096,0.2024844487508138
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,1024,3584,0.12018756071726482
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,1024,2560,0.01705777810679542
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,1024,51200,1.7020577324761286
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,1024,3584,0.17698666784498426
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,1024,65536,3.022135204739041
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,1024,3072,0.101565334531996
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,1024,3072,0.15223999818166098
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,1024,1536,0.012031111452314587
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,1024,2560,0.12997244464026556
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,1024,1024,0.009375111096435124
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,1024,2048,0.07044621970918444
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,1024,2048,0.10774133602778117
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,1024,1536,0.05404533280266655
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,1024,1536,0.08601955572764079
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,1024,1024,0.03699644406636556
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,1024,1024,0.06270133124457465
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,1024,512,0.006625777731339137
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,1024,768,0.053047110637029014
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,1024,256,0.0053546664615472155
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,1024,512,0.02441066669093238
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,1024,512,0.04255200094646878
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,1024,128,0.004599110947714912
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,1024,256,0.018239999810854595
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,1024,256,0.03276088833808899
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,1024,128,0.02632177703910404
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,1024,128,0.016135111451148987
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,1024,64,0.0042168887125121225
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,1024,3072,0.019835554891162448
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,1024,32,0.004212444441186057
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,1024,64,0.0155102229780621
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,1024,32,0.015126221709781222
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,1024,2048,0.014767110347747803
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,768,65536,0.27562665939331055
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,1024,2560,0.08573777808083428
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,768,51200,0.22699912389119467
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,1024,768,0.007962666451931
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,768,16384,0.07134933604134454
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,1024,768,0.030935999419954088
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,768,12288,0.05643466446134779
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,768,16384,0.5364382002088759
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,768,12288,0.40457865926954484
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,768,10240,0.04682933290799459
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,768,16384,0.7833369043138293
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,768,12288,0.5849244329664443
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,768,10240,0.3399395677778456
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,768,8192,0.03911911116706
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,768,51200,1.6483644909328883
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,768,10240,0.4912737740410699
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,768,7168,0.03228800164328681
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,768,6144,0.02737422287464142
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,768,8192,0.27438399526807994
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,768,65536,2.110332489013672
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,768,5120,0.023330666952663
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,768,7168,0.24154755804273817
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,768,6144,0.2081377771165636
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,768,7168,0.3494444423251682
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,768,4096,0.019347555107540555
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,768,6144,0.3029048972659641
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,768,5120,0.17367377546098497
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,768,5120,0.25553777482774526
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,768,51200,2.362450705634223
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,768,4096,0.13663733005523682
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,768,3072,0.01590488851070404
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,768,4096,0.2013333373599582
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,768,2560,0.013622221847375235
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,768,3584,0.11774933338165283
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,768,3584,0.17613422870635986
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,768,3072,0.09894577662150066
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,768,2048,0.011758222348160215
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,768,3072,0.15205689271291098
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,768,1536,0.010055999788973067
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,768,2560,0.08358666631910537
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,768,2560,0.1296915610631307
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,768,1024,0.008012444608741337
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,768,2048,0.06805688805050321
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,768,65536,3.0112107594807944
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,768,2048,0.10760621892081366
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,768,768,0.0069217777086628815
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,768,1536,0.051860445075564914
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,768,1536,0.08558222320344712
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,768,512,0.005883555445406172
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,768,1024,0.03559733430544535
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,768,1024,0.06294577651553683
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,768,256,0.004911111046870549
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,768,768,0.02980355421702067
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,768,768,0.05387377738952637
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,768,128,0.004242666479614046
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,768,512,0.02368800010946062
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,768,512,0.04186844494607714
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,768,64,0.003834666477309333
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,768,256,0.03239288926124573
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,768,32,0.004019555532270008
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,768,256,0.01758577757411533
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,768,128,0.025761778155962627
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,768,128,0.01518133282661438
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,768,64,0.014676445060306124
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,768,32,0.014429334137174817
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,512,65536,0.2056302229563395
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,512,51200,0.1641813384162055
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,512,16384,0.053448888990614146
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,512,16384,0.5160862074957954
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,512,12288,0.040539556079440646
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,512,16384,0.7461582289801704
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,768,8192,0.3968079884847005
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,512,10240,0.035750223530663386
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,512,12288,0.3899511231316461
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,768,3584,0.017860444055663217
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,512,8192,0.026622222529517278
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,512,10240,0.3280453417036268
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,512,51200,1.5854817496405706
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,512,12288,0.5567030906677246
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,512,7168,0.0221377776728736
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,512,8192,0.26433245340983075
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,512,10240,0.46725956598917645
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,512,6144,0.0191600008143319
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,512,65536,2.023775100708008
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,512,7168,0.23266755210028756
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,512,5120,0.01686044368478987
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,512,7168,0.3336168924967448
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,512,6144,0.2001955509185791
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,512,4096,0.014554666148291694
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,512,6144,0.2884133391910129
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,512,5120,0.16675289471944174
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,512,51200,2.245361751980252
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,512,3584,0.012616000241703458
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,512,5120,0.2434204419453939
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,512,3072,0.011732444167137146
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,512,4096,0.1317626635233561
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,512,4096,0.1922924386130439
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,512,2560,0.010383110907342698
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,512,3584,0.16776711410946318
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,512,3584,0.11289066738552517
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,512,3072,0.09486311011844212
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,512,3072,0.14474222395155165
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,512,2048,0.00867733359336853
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,512,1536,0.007653333246707916
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,512,2560,0.08012000057432386
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,512,65536,2.8674568600124783
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,512,2560,0.12321066856384277
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,512,2048,0.1027253336376614
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,512,1024,0.006238222122192383
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,512,1536,0.04845777816242642
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,512,768,0.00555377784702513
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,512,1536,0.08142844173643324
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,512,512,0.004871110949251386
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,512,1024,0.0594924423429701
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,512,768,0.0505600008699629
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,512,768,0.028424888849258423
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,512,256,0.004193777839342753
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,512,8192,0.3783448802100287
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,512,512,0.022859555151727464
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,512,512,0.04010755485958523
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,512,128,0.0038542221817705366
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,512,64,0.0034977777136696708
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,512,256,0.030866665972603693
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,512,128,0.025047111842367385
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,512,128,0.014431110686726041
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,512,64,0.013750221994188098
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,512,32,0.013782222237851886
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,512,2048,0.06503466765085857
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,256,51200,0.09736710786819458
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,512,1024,0.034268445438808866
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,512,256,0.01682044400109185
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,512,32,0.0035173334181308746
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,256,16384,0.03786755601565043
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,256,65536,0.12383377552032471
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,256,12288,0.02903644575013055
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,256,16384,0.4964070849948459
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,256,10240,0.021968000464969214
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,256,12288,0.3756284448835585
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,256,65536,1.9468097686767578
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,256,8192,0.01738666660255856
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,256,12288,0.5527733167012533
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,256,10240,0.31489600075615776
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,256,7168,0.01584533353646596
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,256,51200,1.5211706161499023
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,256,8192,0.25462044609917533
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,256,6144,0.01383733335468504
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,256,7168,0.2237617704603407
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,256,8192,0.3756222195095486
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,256,5120,0.012626666989591388
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,256,7168,0.33088800642225474
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,256,65536,2.8433581458197703
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,256,6144,0.2869386672973633
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,256,5120,0.16093156072828504
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,256,51200,2.2267394595675998
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,256,5120,0.24168178770277235
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,256,3584,0.010011555420027839
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,256,16384,0.7301671240064832
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,256,4096,0.12637955612606472
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,256,3072,0.009023110899660323
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,256,4096,0.19074932734171549
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,256,2560,0.008159110943476358
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,256,3584,0.16661511527167425
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,256,3072,0.09051999780866836
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,256,3072,0.14364177650875515
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,256,2048,0.006989333364698622
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,256,2560,0.0759119987487793
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,256,10240,0.46440712610880536
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,256,1536,0.006256000035338932
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,256,2560,0.122143997086419
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,256,1024,0.005203555441564984
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,256,2048,0.06184177928500705
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,256,2048,0.10168444448047215
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,256,768,0.004880889008442561
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,256,1536,0.04614311125543383
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,256,1024,0.032476445039113365
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,256,1024,0.05968799855973986
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,256,6144,0.19304354985555014
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,256,768,0.027087110612127516
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,256,768,0.05033066537645128
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,256,256,0.0038399998512532976
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,256,512,0.021871111459202234
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,256,512,0.03958666655752394
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,256,128,0.003351111171974076
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,256,256,0.030541333887312148
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,256,256,0.015799111790127225
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,256,4096,0.01036177741156684
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,256,64,0.0031475555151700974
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,256,32,0.003240888938307762
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,256,128,0.024326221810446844
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,256,128,0.013618666264745923
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,256,64,0.01277599980433782
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,128,65536,0.09566844171947902
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,128,51200,0.07644000318315294
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,256,3584,0.10817066828409831
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,256,1536,0.08096888992521498
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,128,16384,0.03083555565940009
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,256,512,0.0041626666982968645
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,256,32,0.01274311128589842
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,128,16384,0.48628711700439453
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,128,12288,0.022429333792792425
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,128,10240,0.01628800067636702
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,128,16384,0.7269644207424588
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,128,51200,1.4889716042412653
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,128,8192,0.01366666704416275
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,128,12288,0.3677893214755588
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,128,65536,1.9074728224012587
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,128,10240,0.3087564574347602
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,128,7168,0.012558221817016602
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,128,12288,0.5521599981519911
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,128,6144,0.011416888899273343
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,128,8192,0.24902844429016113
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,128,10240,0.46297423044840497
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,128,5120,0.009773333039548662
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,128,7168,0.2192844417360094
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,128,8192,0.37444265683492023
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,128,6144,0.18860977225833467
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,128,7168,0.33054934607611763
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,128,51200,2.2208614349365234
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,128,5120,0.15727821985880533
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,128,6144,0.2857982317606608
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,128,3584,0.007882666256692674
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,128,3072,0.007251555720965068
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,128,5120,0.24126044909159342
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,128,4096,0.12372267246246338
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,128,4096,0.1905804475148519
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,128,2560,0.0067528887755341
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,128,3584,0.10582133134206136
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,128,3584,0.16601244608561197
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,128,2048,0.005767999837795894
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,128,3072,0.08854489194022284
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,128,3072,0.1428933276070489
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,128,1536,0.0052586665583981415
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,128,2560,0.12194844086964925
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,128,2560,0.07414488659964667
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,128,1024,0.004243555582231945
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,128,2048,0.05986933575736152
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,128,2048,0.1012115544743008
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,128,768,0.0038684445122877755
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,128,1536,0.080530669954088
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,128,1536,0.045490665568245776
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,128,512,0.0035582222044467926
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,128,1024,0.03188088867399428
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,128,1024,0.05850311120351156
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,128,256,0.0034888887570963967
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,128,768,0.04996711015701294
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,128,768,0.026429333620601233
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,128,512,0.02125511070092519
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,128,256,0.01517688896920946
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,128,256,0.02979288829697503
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,128,64,0.0028640000770489373
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,128,128,0.013112000293201871
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,128,32,0.0031724443866146933
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,128,64,0.012436444560686747
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,64,65536,0.08722577492396037
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,128,4096,0.008355555435021719
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,128,32,0.012446222205956778
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,64,51200,0.07203555769390531
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,64,16384,0.02933688958485921
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,64,12288,0.019243554936514962
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,128,65536,2.843012491861979
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,64,10240,0.015848888291252982
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,64,12288,0.36693512068854434
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,64,16384,0.48537243737114805
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,64,8192,0.012717333104875354
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,64,7168,0.011410666836632622
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,128,512,0.039637333816952176
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,64,6144,0.010384000009960597
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,64,10240,0.3079040050506592
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,64,8192,0.2487013339996338
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,64,5120,0.009307555854320526
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,64,7168,0.2185466686884562
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,64,4096,0.00794577764140235
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,64,3584,0.007261333366235097
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,64,6144,0.18867822488149008
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,64,3072,0.006598222172922558
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,64,3584,0.10525155729717678
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,64,2560,0.005893333504597346
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,64,51200,1.4899493323432074
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,64,2048,0.00555377784702513
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,64,3072,0.08825333250893487
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,64,1536,0.004767111192146937
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,64,2560,0.07467022207048205
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,64,1024,0.0041804446114434134
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,64,2048,0.06031644344329834
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,64,1536,0.04493600130081177
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,64,768,0.0038497779104444715
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,64,512,0.00349866681628757
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,64,65536,1.9063599904378254
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,64,1024,0.03173333406448364
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,64,256,0.0032142222755485107
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,64,768,0.02644088864326477
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,64,512,0.020928000410397846
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,64,128,0.003165333428316646
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,64,256,0.01514400045077006
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,64,64,0.002817777709828483
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,128,128,0.0031742221779293488
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,64,32,0.0028693332440323303
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,64,128,0.012444444828563266
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,32,65536,0.0879475540584988
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,64,64,0.01239111108912362
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,64,32,0.012179555164443122
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,32,51200,0.0706204440858629
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,32,16384,0.027115555273161993
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,64,5120,0.1574124495188395
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,32,12288,0.01640888883007897
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,64,4096,0.12312889099121094
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,32,10240,0.012067555553383298
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,32,8192,0.01036888857682546
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,32,12288,0.36646223068237305
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,32,8192,0.24839467472500273
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,32,16384,0.48612176047431094
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,32,7168,0.009640889035330879
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,32,6144,0.009000000026490953
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,32,5120,0.01203644441233741
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,32,6144,0.18815555837419298
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,32,7168,0.21870756149291992
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,32,4096,0.010037333601050908
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,32,3584,0.009321778184837764
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,32,4096,0.1233173343870375
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,32,3072,0.007990222010347579
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,32,3584,0.1061591108640035
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,32,2560,0.0075937774446275495
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,32,51200,1.4882062276204426
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,32,3072,0.08886844582027859
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,32,2048,0.005547555370463266
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,32,2560,0.07425777779685126
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,32,1536,0.004567999806669024
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,32,1024,0.0041999999019834726
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,32,2048,0.06018222040600247
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,32,1536,0.044455111026763916
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,32,65536,1.904422124226888
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,32,1024,0.031856000423431396
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,32,512,0.0035146665241983202
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,32,256,0.003162666741344664
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,32,768,0.02638133366902669
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,32,512,0.020992888344658747
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,32,128,0.00286311118139161
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,32,64,0.0028657778683635923
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,32,32,0.002806222273243798
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,32,128,0.013021333350075616
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,32,5120,0.15726310676998562
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,32,64,0.012064889073371887
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,32,32,0.011857777833938599
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,32,10240,0.3077813254462348
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4096,32,256,0.01482222146458096
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4096,32,768,0.0038684445122877755
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,65536,12288,3.6744897630479603
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,65536,16384,4.795269436306424
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,65536,12288,4.18959003024631
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,65536,10240,3.4280444251166453
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,65536,16384,5.972709231906467
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,65536,8192,2.7414639790852866
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,65536,7168,2.267527050442166
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,65536,10240,3.4243253072102866
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,65536,8192,2.658568912082248
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,65536,7168,2.3058533138699002
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,65536,6144,1.8491884867350261
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,65536,5120,1.634961764017741
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,65536,4096,1.2908959918551974
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,65536,5120,1.6920222176445856
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,65536,6144,1.940592024061415
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,65536,3584,1.0830604765150282
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,65536,3072,0.997529771592882
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,65536,3072,0.9624267154269748
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,65536,4096,1.3036461936102974
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,65536,3584,1.1772818035549588
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,65536,2048,0.6076151000128852
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,65536,2560,0.8497724533081055
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,65536,1536,0.45513068305121523
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,65536,2048,0.6719386842515734
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,65536,2560,1.0676986906263564
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,65536,1024,0.377222220102946
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,65536,768,0.23373156123691133
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,65536,1024,0.463481797112359
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,65536,1536,0.6684915754530164
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,65536,512,0.2074577808380127
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,65536,768,0.324074665705363
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,65536,256,0.14293866687350804
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,65536,512,0.28141334321763783
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,65536,128,0.14139910538991293
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,65536,64,0.09989244408077663
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,65536,256,0.24696087837219238
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,65536,32,0.1265315612157186
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,65536,128,0.22644623120625815
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,65536,64,0.23106845219930014
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,65536,32,0.2342533270517985
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,65536,51200,15.37738037109375
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,51200,16384,4.036011589898004
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4096,128,128,0.023656888140572443
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,51200,12288,2.921987533569336
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,51200,16384,4.6237335205078125
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,51200,12288,3.3049956427680125
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,51200,10240,2.5989422268337674
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,51200,10240,2.7221929762098522
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,51200,8192,2.1231689453125
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,51200,51200,12.332801818847656
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,51200,8192,2.1067235734727645
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,51200,7168,1.761768870883518
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,65536,51200,26.102345784505207
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,51200,7168,1.8559065924750433
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,51200,5120,1.2361208597819011
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,51200,6144,1.6130861706203883
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,51200,6144,1.5870986514621312
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,51200,5120,1.3424897723727758
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,51200,4096,0.9603226979573568
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,51200,3584,0.8872195349799262
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,51200,3584,0.9038595623440213
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,51200,3072,0.7049582269456652
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,51200,4096,1.0395547019110787
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,51200,65536,15.52852037217882
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,51200,3072,0.9027946260240344
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,51200,2048,0.5009439786275228
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,51200,2048,0.5409110916985406
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,51200,2560,0.6579626931084527
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,51200,1536,0.3956266774071588
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,51200,2560,0.5456346405877007
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,51200,1536,0.4290364318423801
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,51200,512,0.1560693316989475
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,51200,1024,0.24201689826117623
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,51200,1024,0.31926488876342773
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,51200,256,0.11737599637773301
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,51200,512,0.2144328885608249
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,51200,256,0.20158310731252035
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,51200,64,0.07435199949476454
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,51200,128,0.0858995583322313
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,51200,32,0.07850755585564508
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,51200,128,0.18741067250569662
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,51200,768,0.37374220954047305
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,51200,64,0.18277955055236816
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,51200,32,0.18239288859897188
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,51200,768,0.19194222821129692
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,16384,16384,1.2060897615220811
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,16384,12288,0.8997440338134766
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,16384,16384,1.7483306460910375
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,51200,51200,19.475753784179688
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,16384,10240,0.8183929125467936
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,16384,12288,1.2765528361002605
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,16384,51200,3.879912906222873
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,16384,8192,0.6865413453843859
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,16384,10240,1.0743563969930012
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,16384,7168,0.5814302232530382
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,16384,8192,0.8292729059855143
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,16384,6144,0.4270808961656358
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,16384,65536,4.877687242296007
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,16384,7168,0.870572461022271
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,16384,5120,0.3791182306077745
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,16384,4096,0.3123688962724474
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,16384,3584,0.2649075455135769
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,16384,5120,0.5539920065138075
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,16384,4096,0.40916532940334743
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,16384,6144,0.7692506578233508
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,16384,3072,0.2442533440060086
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,16384,3584,0.3744835588667128
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,16384,2560,0.19469332695007324
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,16384,3072,0.31006932258605957
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,16384,2048,0.17971289157867432
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,16384,2560,0.2617795467376709
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,16384,1024,0.08494666549894546
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,16384,2048,0.21646666526794434
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,16384,768,0.06774666574266222
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,16384,1536,0.1695635583665636
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,16384,1024,0.12693066067165798
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,16384,512,0.04977155394024319
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,16384,256,0.035389333963394165
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,16384,768,0.10241599877675374
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,16384,128,0.03128711051411099
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,16384,512,0.0839280022515191
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,16384,256,0.07646933529112074
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,16384,64,0.028267555766635474
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,16384,128,0.06771466467115614
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,16384,32,0.03211999932924906
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,16384,64,0.0674275557200114
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,16384,32,0.06836177905400594
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,16384,1536,0.11384088463253444
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,16384,51200,7.5144500732421875
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,12288,16384,0.8984168370564779
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,51200,65536,25.424219767252605
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,12288,12288,0.755975087483724
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,12288,16384,1.444300439622667
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,16384,65536,9.618759155273438
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,12288,51200,2.828342225816515
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,12288,10240,0.6332035594516331
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,12288,8192,0.5211377673678929
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,12288,12288,1.0715582105848525
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,12288,10240,0.8655671013726128
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,12288,7168,0.44026933776007754
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,12288,6144,0.3538915581173367
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,12288,65536,3.7569732666015625
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,12288,8192,0.7187751134236654
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,12288,5120,0.3048986593882243
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,12288,4096,0.2472613387637668
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,12288,6144,0.5104915301005045
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,12288,7168,0.790196418762207
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,12288,4096,0.3375875684950087
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,12288,5120,0.5135928789774576
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,12288,3584,0.29027822282579213
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,12288,3072,0.20514310730828178
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,12288,2560,0.14782488346099854
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,12288,3072,0.24955466058519152
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,12288,2048,0.1313191122478909
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,12288,1536,0.09453777472178142
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,12288,2560,0.21334044138590494
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,12288,1024,0.06502488586637709
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,12288,1536,0.14062400658925375
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,12288,768,0.052188442813025586
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,12288,512,0.03830400109291077
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,12288,2048,0.1759199963675605
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,12288,256,0.028402666250864666
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,12288,768,0.08601422442330255
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,12288,512,0.0689271092414856
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,12288,128,0.024355555574099224
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,12288,256,0.058509336577521436
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,12288,64,0.020804444948832195
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,12288,32,0.021024000313546922
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,12288,128,0.05397689011361864
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,12288,3584,0.2164106633928087
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,12288,64,0.05414666732152303
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,12288,51200,5.5714772542317705
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,12288,32,0.05504177676306831
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,12288,1024,0.104001780351003
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,10240,16384,0.7524728775024414
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,10240,12288,0.6399040222167969
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,12288,65536,7.3191333346896705
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,10240,12288,0.9093892839219836
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,10240,16384,1.2571101718478732
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,10240,10240,0.5480711195203993
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,10240,8192,0.38739289177788633
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,10240,51200,2.3998692830403647
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,10240,7168,0.36127199067009824
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,10240,6144,0.31199555926852757
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,10240,8192,0.6082568698459202
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,10240,65536,3.0099707709418406
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,10240,7168,0.5570915540059408
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,10240,5120,0.2797519895765516
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,10240,6144,0.49811824162801105
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,10240,4096,0.20019111368391249
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,10240,5120,0.3784133328331842
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,10240,3584,0.18718132707807753
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,10240,3072,0.14572621716393366
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,10240,4096,0.2980479929182264
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,10240,2560,0.13019822703467474
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,10240,3584,0.26412444644504124
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,10240,3072,0.22220888402726915
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,10240,1536,0.08440799845589532
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,10240,1024,0.056906667020585805
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,10240,10240,0.7739760080973307
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,10240,1536,0.12274311648474799
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,10240,2048,0.17517511049906412
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,10240,768,0.04153777824507819
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,10240,512,0.03203199969397651
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,10240,256,0.025314667158656653
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,10240,1024,0.0927191111776564
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,10240,768,0.07492978043026395
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,10240,128,0.02128977742460039
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,10240,512,0.06168711185455322
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,10240,64,0.01885777711868286
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,10240,256,0.05259911219278971
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,10240,32,0.019835554891162448
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,10240,128,0.04766577813360426
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,10240,64,0.04756444361474779
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,10240,32,0.04791555470890469
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,10240,2048,0.09770577483707005
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,10240,51200,4.878470102945964
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,10240,2560,0.21251377794477674
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,8192,16384,0.534312884012858
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,8192,12288,0.4215564462873671
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,8192,10240,0.37509245342678493
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,10240,65536,6.231021457248264
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,8192,12288,0.806247976091173
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,8192,51200,1.993551042344835
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,8192,8192,0.301238218943278
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,8192,7168,0.26837865511576336
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,8192,10240,0.7253573205735949
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,8192,8192,0.5265928904215494
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,8192,6144,0.24668799506293404
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,8192,7168,0.49440977308485246
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,8192,5120,0.1969697740342882
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,8192,4096,0.1573128832711114
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,8192,3584,0.1333084503809611
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,8192,5120,0.37705334027608234
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,8192,4096,0.257841772503323
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,8192,16384,1.0993004904852974
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,8192,3072,0.11417155795627171
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,8192,2560,0.10921600129869248
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,8192,3584,0.2365964518653022
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,8192,2048,0.07812355624304877
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,8192,3072,0.19481866889529756
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,8192,2560,0.16832533147599962
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,8192,1024,0.04507466819551256
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,8192,2048,0.13884711265563965
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,8192,1536,0.10794577995936076
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,8192,768,0.034669333034091525
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,8192,65536,2.725823084513346
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,8192,1024,0.08171111345291138
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,8192,512,0.024392000503010217
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,8192,256,0.019254222512245178
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,8192,768,0.06583733028835721
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,8192,512,0.05379555622736613
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,8192,51200,4.0132365756564665
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,8192,6144,0.4037937853071425
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,8192,128,0.017454221844673157
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,8192,256,0.04292533463901944
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,8192,64,0.01626488897535536
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,8192,32,0.01570755574438307
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,8192,128,0.0387733346886105
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,8192,64,0.037408000893063016
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,8192,32,0.03704444567362467
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,8192,1536,0.0605600012673272
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,7168,16384,0.5604089101155599
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,8192,65536,5.16701168484158
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,7168,12288,0.4433146582709418
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,7168,16384,0.9962373309665256
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,7168,10240,0.3813626766204834
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,7168,12288,0.7747768825954862
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,7168,51200,1.817383024427626
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,7168,8192,0.30341243743896484
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,7168,7168,0.25046934021843803
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,7168,65536,2.2337892320421004
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,7168,6144,0.21786933475070527
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,7168,8192,0.5987582206726074
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,7168,5120,0.18030667304992676
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,7168,7168,0.5252124468485514
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,7168,6144,0.3967564370897081
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,7168,4096,0.15077600214216444
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,7168,3584,0.1185706721411811
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,7168,3072,0.10944533348083496
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,7168,5120,0.36000532574123806
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,7168,4096,0.2744266721937391
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,7168,2560,0.08741866879993015
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,7168,3584,0.21288800239562988
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,7168,2048,0.07378488779067993
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,7168,3072,0.18326132827334932
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,7168,1536,0.06477777825461493
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,7168,1024,0.043473776843812734
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,7168,2560,0.1596577829784817
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,7168,2048,0.13042222128974065
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,7168,768,0.03245155678855048
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,7168,512,0.024667556087176006
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,7168,1024,0.07604266537560357
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,7168,1536,0.10382222466998631
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,7168,256,0.018618666463428073
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,7168,10240,0.6168933444552952
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,7168,128,0.016207999653286405
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,7168,512,0.048914667632844716
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,7168,64,0.013457777599493662
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,7168,32,0.013938667045699226
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,7168,256,0.038726223839653864
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,7168,128,0.03496888942188687
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,7168,64,0.03446311089727614
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,7168,32,0.03359555535846286
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,7168,51200,3.6795404222276478
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,6144,16384,0.4543440077039931
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,6144,12288,0.37497867478264707
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,7168,768,0.06296622090869479
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,7168,65536,4.62715827094184
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,6144,16384,0.9261946148342557
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,6144,10240,0.2900328901078966
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,6144,51200,1.5467813279893663
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,6144,8192,0.23832800653245714
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,6144,7168,0.22134844462076822
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,6144,12288,0.7227653397454156
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,6144,10240,0.572397338019477
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,6144,65536,1.9998096889919703
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,6144,6144,0.18341510825686982
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,6144,8192,0.4665848943922255
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,6144,5120,0.1474239958657159
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,6144,4096,0.12427200211419
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,6144,3584,0.10250577661726211
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,6144,7168,0.4219555589887831
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,6144,6144,0.3465013239118788
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,6144,3072,0.08657422330644395
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,6144,4096,0.22651910781860352
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,6144,5120,0.34292621082729763
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,6144,2560,0.07431288560231526
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,6144,2048,0.06579199764463636
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,6144,3584,0.2280506557888455
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,6144,1536,0.050360000795788236
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,6144,1024,0.03635911146799723
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,6144,2560,0.16463643974728054
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,6144,768,0.029330667522218492
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,6144,2048,0.12724799580044216
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,6144,512,0.02352622151374817
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,6144,1536,0.0928986668586731
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,6144,256,0.016913778252071805
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,6144,1024,0.06955911053551568
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,6144,128,0.014875556031862894
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,6144,768,0.05969866779115465
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,6144,512,0.043876445955700345
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,6144,256,0.0343777769141727
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,6144,32,0.015974221958054435
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,6144,128,0.031277332040998675
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,6144,64,0.03201422095298767
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,6144,32,0.03052355514632331
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,6144,51200,3.3731492360432944
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,6144,3072,0.17191199461619058
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,6144,64,0.016185777054892648
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,6144,65536,4.196167839898004
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,5120,16384,0.36069689856635195
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,5120,51200,1.2373723983764648
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,5120,12288,0.28640709982977974
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,5120,65536,1.6482328838772242
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,5120,10240,0.31979287995232475
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,5120,8192,0.24371200137668184
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,5120,12288,0.6551395522223579
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,5120,16384,0.8342729144626193
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,5120,7168,0.22202755345238578
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,5120,10240,0.5756737920973036
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,5120,6144,0.1604000065061781
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,5120,8192,0.5108728938632542
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,5120,5120,0.12789777914683023
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,5120,7168,0.3694942262437608
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,5120,4096,0.1036648882759942
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,5120,3584,0.0894355575243632
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,5120,3072,0.07979555262459649
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,5120,5120,0.2607671154869927
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,5120,6144,0.377696885002984
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,5120,2560,0.06926755772696601
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,5120,4096,0.20394844479031035
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,5120,3584,0.17734132872687447
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,5120,2048,0.06268977456622653
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,5120,1536,0.04247022337383694
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,5120,3072,0.15558400419023302
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,5120,1024,0.035813334915373064
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,5120,768,0.022239999638663396
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,5120,2560,0.12789421611362034
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,5120,512,0.01735911104414198
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,5120,2048,0.1089271108309428
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,5120,256,0.014137778017255994
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,5120,1536,0.08512088987562393
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,5120,1024,0.06289066871007283
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,5120,128,0.011367110742463006
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,5120,768,0.0518124434683058
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,5120,32,0.010092444717884064
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,5120,512,0.039192888471815325
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,5120,256,0.03070311082734002
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,5120,128,0.028143111202451918
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,5120,64,0.028135998381508723
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,5120,32,0.028134223487642076
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,5120,51200,3.091555489434136
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,4096,16384,0.3154719935523139
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,5120,65536,3.7361547682020397
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,4096,12288,0.24499289194742838
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,4096,51200,0.8689226574367948
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,4096,10240,0.205567995707194
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,4096,65536,1.298267576429579
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,5120,64,0.01000355515215132
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,4096,16384,0.7681004206339518
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,4096,8192,0.16454133722517225
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,4096,7168,0.14574133025275335
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,4096,6144,0.12269422743055557
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,4096,12288,0.5622497664557563
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,4096,5120,0.10158577892515396
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,4096,10240,0.5060924424065484
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,4096,4096,0.08207377460267809
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,4096,7168,0.33334843317667645
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,4096,8192,0.4671946631537543
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,4096,6144,0.28530934121873647
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,4096,3584,0.075126224093967
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,4096,5120,0.23657245106167266
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,4096,2560,0.05583110782835218
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,4096,4096,0.18714222643110487
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,4096,2048,0.043769776821136475
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,4096,3584,0.16114844216240778
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,4096,3072,0.13804354932573107
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,4096,1024,0.0251857770813836
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,4096,2560,0.1169466707441542
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,4096,2048,0.09587822357813518
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,4096,768,0.019479999939600628
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,4096,1536,0.07658666372299194
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,4096,512,0.014531556102964612
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,4096,256,0.011931555966536203
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,4096,1024,0.05590133534537422
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,4096,768,0.04562755425771078
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,4096,128,0.00978488889005449
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,4096,512,0.035190221336152815
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,4096,64,0.008967999782827165
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,4096,256,0.027451554934183758
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,4096,128,0.025018667181332905
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,4096,64,0.024659555819299486
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,4096,51200,2.5759874979654946
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,4096,32,0.02437955637772878
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,4096,3072,0.07355199919806586
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,4096,1536,0.03615022367901272
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,4096,65536,3.261793772379557
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,3584,16384,0.2882311079237196
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,3584,51200,0.868226687113444
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,3584,65536,1.0029581917656791
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,3584,12288,0.22948622703552246
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,3584,10240,0.19677510526445177
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,4096,32,0.009096889032257928
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,3584,8192,0.15200444062550864
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,3584,7168,0.1318933301501804
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,3584,12288,0.5349457528856065
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,3584,16384,0.7046044667561849
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,3584,6144,0.10490222109688653
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,3584,10240,0.513246218363444
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,3584,5120,0.08717866738637288
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,3584,4096,0.06971466541290283
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,3584,6144,0.27057332462734646
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,3584,7168,0.351074669096205
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,3584,3584,0.06964088810814752
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,3584,5120,0.2288266552819146
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,3584,3072,0.05816533168156942
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,3584,4096,0.18046755260891387
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,3584,2560,0.04319733381271362
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,3584,3584,0.16289156013064915
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,3584,2048,0.03887288769086202
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,3584,3072,0.13448177443610296
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,3584,1536,0.029167999823888142
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,3584,1024,0.021133333444595337
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,3584,2560,0.11147733529408772
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,3584,2048,0.09310399823718601
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,3584,768,0.016178665889634024
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,3584,1536,0.07324088944329156
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,3584,512,0.013003555436929068
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,3584,51200,2.3442755805121527
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,3584,1024,0.053223109907574125
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,3584,256,0.010038221875826517
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,3584,128,0.009014222357008193
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,3584,768,0.04357777701483833
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,3584,64,0.008465777668688033
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,3584,512,0.03304977880583869
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,3584,32,0.00833333366447025
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,3584,256,0.025751999682850305
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,3584,128,0.023424888650576275
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,3584,64,0.02349688940578037
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,3584,32,0.0229777776532703
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,3584,8192,0.4488657845391168
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,3584,65536,3.0181094275580516
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,3072,16384,0.23218933741251627
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,3072,12288,0.18287821610768637
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,3072,10240,0.16488088501824275
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,3072,8192,0.1294800043106079
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,3072,16384,0.6641057862175835
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,3072,65536,0.9297537273830838
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,3072,10240,0.4213431146409776
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,3072,12288,0.49946753184000653
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,3072,7168,0.11716000239054362
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,3072,6144,0.09987911250856187
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,3072,5120,0.0783991085158454
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,3072,8192,0.3523857858445909
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,3072,4096,0.06477422184414335
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,3072,6144,0.25594133800930446
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,3072,3584,0.05504177676306831
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,3072,7168,0.35704978307088214
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,3072,5120,0.21319999959733751
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,3072,3072,0.04877600073814392
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,3072,2560,0.039120889372295804
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,3072,4096,0.17046933703952363
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,3072,2048,0.03295288814438714
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,3072,3584,0.1440462271372477
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,3072,1536,0.026731555660565693
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,3072,3072,0.12961333327823216
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,3072,1024,0.019448000523779128
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,3072,2560,0.10519111156463623
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,3072,768,0.01552888916598426
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,3072,512,0.01240533341964086
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,3072,2048,0.08710933393902248
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,3072,1536,0.06509333186679415
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,3072,1024,0.04931111137072245
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,3072,768,0.040361778603659734
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,3072,128,0.008616888688670265
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,3072,512,0.03087377879354689
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,3072,64,0.007489778101444244
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,3072,51200,0.7284346686469184
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,3072,32,0.007607999775144789
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,3072,256,0.024102222588327196
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,3072,128,0.021996445126003687
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,3072,64,0.021149333980348375
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,3072,51200,2.164598253038194
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,3072,32,0.021369778447681006
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,2560,16384,0.21877777576446533
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,2560,12288,0.15371021959516737
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,2560,51200,0.566632005903456
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,3072,65536,2.7506205240885415
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,2560,65536,0.7927555508083768
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,2560,16384,0.6280835469563802
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,2560,10240,0.1326506667666965
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,2560,8192,0.1126977735095554
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,2560,7168,0.09016178051630656
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,3072,256,0.010689777632554373
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,2560,6144,0.08006133635838826
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,2560,12288,0.4955155584547255
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,2560,10240,0.39657778210110134
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,2560,5120,0.06756977902518378
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,2560,8192,0.32093334197998047
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,2560,4096,0.054541332854164966
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,2560,6144,0.24202399783664277
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,2560,3584,0.04390577806366814
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,2560,7168,0.333663993411594
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,2560,3072,0.04066133168008592
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,2560,4096,0.17400177319844565
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,2560,5120,0.2043671078152127
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,2560,2560,0.033957332372665405
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,2560,3584,0.13665066825018987
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,2560,2048,0.027235555979940627
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,2560,3072,0.1175653272204929
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,2560,1536,0.023002665903833177
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,2560,1024,0.017664889494578045
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,2560,768,0.014477334088749357
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,2560,2560,0.10335110955768162
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,2560,512,0.012256888879670037
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,2560,1024,0.04641155401865641
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,2560,256,0.008984000318580205
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,2560,768,0.03717866539955139
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,2560,128,0.007309333317809635
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,2560,512,0.03085600005255805
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,2560,64,0.006632888896597757
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,2560,51200,2.0248470306396484
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,2560,128,0.0203493336836497
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,2560,32,0.006598222172922558
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,2560,64,0.0196106665664249
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,2560,32,0.019928000039524503
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,2560,65536,2.578367021348741
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,2048,65536,0.6185297966003418
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,2560,2048,0.0814888874689738
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,2048,16384,0.171888894504971
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,2048,12288,0.13019377655453152
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,2560,256,0.022678222921159532
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,2048,10240,0.09320800171958075
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,2048,16384,0.5899137920803493
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,2048,12288,0.49763732486301
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,2048,10240,0.3748844464619954
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,2048,7168,0.07604977819654676
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,2048,51200,0.45651997460259336
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,2048,6144,0.06351021925608318
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,2048,8192,0.31244177288479275
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,2048,5120,0.05429866578843859
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,2560,1536,0.06201689110861885
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,2048,7168,0.2667608790927463
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,2048,4096,0.0429440008269416
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,2048,3584,0.039473778671688504
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,2048,6144,0.2296746571858724
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,2048,51200,1.8720667097303603
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,2048,5120,0.19237777921888563
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,2048,2560,0.02888622217708164
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,2048,4096,0.1497653325398763
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,2048,2048,0.024271999796231587
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,2048,65536,2.3970247904459634
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,2048,3072,0.11080000135633682
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,2048,2560,0.09463466538323297
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,2048,2048,0.07654044363233778
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,2048,768,0.012207110722859701
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,2048,1536,0.05730933613247342
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,2048,1024,0.04164088765780131
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,2048,512,0.009364444348547194
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,2048,8192,0.09042488866382176
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,2048,256,0.007057777709431118
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,2048,768,0.03554133243030972
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,2048,128,0.0063528890411059065
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,2048,64,0.0059004442559348206
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,2048,256,0.02128355536195967
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,2048,32,0.006260444306664997
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,2048,128,0.018889778190188937
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,2048,64,0.018205333087179396
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,2048,32,0.018239999810854595
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,2048,3072,0.034161776304244995
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,1536,65536,0.4523466428120931
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,2048,3584,0.12960533301035562
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,1536,51200,0.3640480041503906
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,2048,1536,0.019325332509146798
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,1536,16384,0.13149600558810765
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,1536,12288,0.09908355606926812
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,2048,1024,0.014764444695578681
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,1536,10240,0.07875021961000231
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,1536,8192,0.059552000628577344
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,1536,7168,0.05219466818703545
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,1536,12288,0.41783732838100857
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,2048,512,0.027404444085227117
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,1536,16384,0.5537155469258627
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,1536,8192,0.3005902237362332
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,1536,6144,0.04708355665206909
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,1536,5120,0.04154400030771891
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,1536,7168,0.24926487604777017
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,1536,4096,0.03176000052028232
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,1536,3584,0.029587556918462116
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,1536,3072,0.02574577762020959
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,1536,6144,0.21512088510725233
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,1536,5120,0.18038488758934867
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,1536,4096,0.13984444406297472
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,1536,3584,0.12001332971784805
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,1536,2048,0.018784888916545443
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,1536,1536,0.014490667316648694
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,1536,2560,0.08825155761506821
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,1536,1024,0.011796444654464722
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,1536,2048,0.07150933477613661
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,1536,768,0.009630222287442949
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,1536,1024,0.03820000092188517
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,1536,512,0.007994666695594788
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,1536,768,0.0322017769018809
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,1536,51200,1.7225706312391493
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,1536,256,0.006594666590293248
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,1536,512,0.02539644473128849
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,1536,128,0.005552000055710475
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,1536,65536,2.2039627499050565
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,1536,10240,0.3916897773742676
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,1536,64,0.004873777843183941
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,1536,32,0.005331555588377847
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,1536,128,0.017330666383107502
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,1536,64,0.016916443904240925
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,1536,32,0.01649599936273363
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,1536,2560,0.022088888618681166
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,1536,3072,0.10291555855009292
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,1024,65536,0.3499528831905789
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,1024,51200,0.27947555647956
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,1024,16384,0.0896844466527303
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,1024,12288,0.07032710976070829
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,1024,10240,0.057265778382619224
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,1024,12288,0.3927360110812717
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,1024,16384,0.5313990910847982
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,1024,8192,0.047841777404149376
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,1024,10240,0.33922576904296875
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,1536,256,0.0195768889453676
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,1024,7168,0.04244800077544319
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,1024,6144,0.033803555700514056
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,1024,5120,0.02801688843303257
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,1024,8192,0.2686266634199354
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,1024,4096,0.02234399980968899
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,1024,7168,0.23562134636773002
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,1024,6144,0.2019617822435167
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,1024,3584,0.019753777318530612
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,1024,3072,0.017605332864655387
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,1024,5120,0.1672595606909858
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,1024,2560,0.01570133368174235
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,1024,4096,0.13128177324930826
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,1024,3584,0.11264177163441975
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,1024,2048,0.013287111288971372
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,1024,1536,0.011074666347768573
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,1024,3072,0.09632088740666707
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,1536,1536,0.05619555711746216
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,1024,1024,0.008672888908121321
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,1024,51200,1.604956414964464
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,1024,768,0.007646222081449296
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,1024,512,0.00657155571712388
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,1024,2048,0.06634666522343953
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,1024,1536,0.05102044343948364
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,1024,256,0.0052435555391841466
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,1024,1024,0.03560444381501939
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,1024,128,0.004845333182149463
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,1024,768,0.030044443077511255
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,1024,64,0.0041848888827694785
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,1024,65536,2.0415049658881292
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,1024,32,0.004521777646409141
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,1024,256,0.018225777480337355
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,1024,128,0.01593777702914344
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,1024,64,0.01514400045077006
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,1024,32,0.015192000402344598
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,768,65536,0.2540382279290093
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,768,16384,0.06727288828955756
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,768,51200,0.19757244322035047
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,768,12288,0.0509475568930308
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,768,10240,0.040658666027916804
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,768,8192,0.035234666532940336
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,768,12288,0.37730222278171116
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,768,8192,0.25657865736219615
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,768,7168,0.02986488739649455
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,768,6144,0.025183111429214478
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,1024,2560,0.08156710863113403
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,768,5120,0.02239377796649933
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,768,7168,0.22529866960313585
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,768,6144,0.19414844777848986
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,1024,512,0.023971555961502924
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,768,4096,0.017879999346203275
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,768,3584,0.01626311077011956
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,768,3072,0.01441333360142178
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,768,4096,0.12619377507103816
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,768,3584,0.10859200027253892
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,768,2560,0.01298577752378252
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,768,2048,0.011064888702498542
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,768,3072,0.09200000100665623
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,768,1536,0.008969777988062965
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,768,51200,1.540986696879069
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,768,2560,0.07790578073925443
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,768,1024,0.007600888609886169
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,768,2048,0.06360799736446805
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,768,768,0.006583111153708563
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,768,1536,0.047593779034084745
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,768,1024,0.033964445193608604
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,768,16384,0.4997573428683811
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,768,256,0.004862222406599256
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,768,65536,1.9661636352539062
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,768,512,0.02275288932853275
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,768,64,0.0038657776183552216
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,768,256,0.01720711092154185
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,768,128,0.015107555521859063
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,768,32,0.0041831110914548235
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,768,64,0.014444443914625378
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,768,32,0.014157333307796054
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,512,65536,0.20311200618743896
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,768,5120,0.1613315608766344
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,512,51200,0.16074221664004856
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,512,16384,0.04986844460169474
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,768,512,0.005559111220969095
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,512,12288,0.03835733400450812
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,768,10240,0.3290613227420383
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,768,768,0.02862488892343309
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,768,128,0.004537777768241035
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,512,10240,0.032313777340783015
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,512,8192,0.023916444844669763
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,512,7168,0.021494223011864558
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,512,12288,0.3682391113705105
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,512,10240,0.3090488910675049
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,512,8192,0.24969334072536895
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,512,6144,0.01904088921017117
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,512,5120,0.016531555189026725
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,512,7168,0.2197697824902005
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,512,4096,0.014075555735164218
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,512,3584,0.01276533305644989
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,512,6144,0.1892497804429796
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,512,5120,0.15724889437357584
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,512,4096,0.12292355961269802
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,512,51200,1.4928578270806208
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,512,3072,0.011343999869293638
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,512,2048,0.00871733327706655
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,512,3072,0.089464889632331
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,512,65536,1.9090889824761286
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,512,2560,0.07562577724456787
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,512,1536,0.007654222349325816
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,512,2048,0.06185866726769341
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,512,1024,0.006072000082996156
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,512,768,0.005527110977305307
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,512,512,0.00488711107108328
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,512,16384,0.48752710554334855
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,512,1024,0.03303733468055725
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,512,256,0.003970666478077571
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,512,768,0.027738667196697656
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,512,128,0.0038533334930737815
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,512,512,0.021984888447655573
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,512,64,0.003546666767862108
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,512,32,0.003504000190231535
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,512,256,0.01648888819747501
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,512,128,0.014137778017255994
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,512,64,0.013797333670987023
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,256,65536,0.11493778228759766
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,512,32,0.013422222601042854
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,256,16384,0.03910488883654276
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,256,51200,0.09258044428295559
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,256,12288,0.02721600068940057
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,256,10240,0.02163022259871165
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,512,2560,0.010061333576838175
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,256,12288,0.3540151119232178
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,256,16384,0.4679128858778212
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,256,10240,0.29686223136054146
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,256,7168,0.015555555621782938
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,256,6144,0.014215999179416232
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,512,1536,0.045915553967158
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,256,7168,0.21063644356197783
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,256,5120,0.012335110869672565
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,256,6144,0.181731555196974
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,256,4096,0.010632889138327705
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,256,3584,0.0099973330895106
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,256,5120,0.15063556035359701
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,256,4096,0.11767289373609756
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,256,3072,0.008990222381220924
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,256,3584,0.10078044732411702
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,256,2560,0.008635555704434713
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,256,2048,0.007284444239404466
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,256,51200,1.430791113111708
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,256,1536,0.00619911112719112
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,256,2560,0.07158133056428698
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,256,2048,0.058296885755327016
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,256,1024,0.005554666535721884
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,256,768,0.0052133335007561584
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,256,1536,0.04427644279268053
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,512,3584,0.10531644688712226
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,256,512,0.004231111043029361
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,256,65536,1.8290159437391493
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,256,8192,0.01682488951418135
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,256,256,0.0038702223036024305
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,256,128,0.003212444484233856
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,256,768,0.026494221554862127
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,256,64,0.0031662223239739737
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,256,512,0.021249777740902368
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,256,32,0.0031964443624019623
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,256,256,0.015807110402319167
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,256,128,0.013491555220550962
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,256,64,0.012778666284349231
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,128,65536,0.08932355377409194
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,256,32,0.012784889174832238
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,128,51200,0.07114399804009332
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,256,8192,0.24009243647257486
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,128,16384,0.028956443071365356
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,128,12288,0.022184888521830242
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,128,10240,0.018848000301255118
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,128,8192,0.013360888593726687
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,128,12288,0.3458426793416341
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,128,10240,0.2899991141425239
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,128,8192,0.2346551153394911
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,128,16384,0.4570124414232042
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,128,6144,0.011016888750924004
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,256,3072,0.08519999848471747
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,128,5120,0.009706666900051964
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,128,7168,0.20592266983456084
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,128,6144,0.17785955799950492
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,128,4096,0.00831822223133511
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,256,1024,0.03145600027508206
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,128,3584,0.00795911086930169
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,128,5120,0.14721333980560303
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,128,3072,0.0069848886794514125
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,128,2560,0.0063075555695427795
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,128,4096,0.11504088507758246
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,128,3584,0.09842666652467515
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,128,2048,0.005931555396980709
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,128,3072,0.0834382242626614
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,128,1536,0.005281777845488654
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,128,2560,0.07002933157814874
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,128,1024,0.004507555729813046
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,128,768,0.004159111115667555
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,128,2048,0.05642222033606636
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,128,51200,1.3988658057318792
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,128,1536,0.04231289029121399
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,128,512,0.003839111162556542
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,128,256,0.003175111073586676
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,128,768,0.02580533259444767
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,128,128,0.003177777760558658
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,128,64,0.003168888803985384
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,128,512,0.020614221692085266
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,128,256,0.0151591118839052
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,128,32,0.003198222153716617
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,128,65536,1.7871066199408636
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,128,128,0.012727999852763282
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,128,64,0.0124195557501581
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,128,7168,0.012331555287043253
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,64,65536,0.09074933661354913
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,64,51200,0.07332089212205675
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,64,16384,0.026312889324294195
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,64,12288,0.016522667474216886
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,64,10240,0.01276266657643848
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,64,12288,0.34568532307942706
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,64,10240,0.2896088759104411
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,64,16384,0.4561991161770291
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,64,8192,0.013081777426931592
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,64,7168,0.011752888560295105
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,64,6144,0.010280888941552904
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,64,8192,0.23401689529418945
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,64,7168,0.20586489306555855
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,128,1024,0.03073244293530782
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,64,5120,0.008955555657545725
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,64,4096,0.007963555554548899
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,64,6144,0.1772222254011366
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,64,3584,0.007179555793603261
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,64,3072,0.006596444381607904
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,64,5120,0.1471546623441908
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,64,4096,0.11407644218868679
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,64,2560,0.006249777972698212
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,64,3584,0.0980808867348565
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,64,2048,0.00543200017677413
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,64,3072,0.08299377891752455
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,64,1536,0.004576888763242298
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,64,51200,1.4004773033989801
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,64,1024,0.004197333421972063
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,64,768,0.0038417776425679526
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,64,2560,0.06924266947640313
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,64,2048,0.05625600285000271
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,64,512,0.003543111185232798
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,64,1536,0.042840000655916005
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,64,256,0.0031644445326593188
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,64,128,0.0028560000161329904
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,64,1024,0.030642665094799463
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,64,64,0.0028782222006056043
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,64,768,0.025760889053344727
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,64,32,0.0029066666546795103
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,64,512,0.020482665962643094
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,64,65536,1.7872123718261719
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,64,128,0.012794666820102267
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,64,64,0.012051555845472546
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,32,65536,0.08624177508884007
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,64,32,0.011742221812407175
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,32,51200,0.07017333639992608
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,32,12288,0.014030221435758801
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,32,10240,0.012069332930776807
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,32,12288,0.34504267904493546
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,32,16384,0.4563048680623372
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,32,10240,0.29004356596204967
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,32,8192,0.01039644413524204
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,32,7168,0.010047111246320937
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,32,6144,0.009322666459613377
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,128,32,0.012063110868136087
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,32,5120,0.012031111452314587
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,32,7168,0.20569688744015166
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,32,8192,0.2338471147749159
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,32,4096,0.009744889206356471
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,32,6144,0.17740978135002983
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,32,3584,0.009305777649084726
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,32,3072,0.008620444271299574
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,64,256,0.014765333798196582
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,32,3584,0.09883289204703437
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,32,2560,0.007644444704055786
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,32,2048,0.0053119998839166425
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,32,3072,0.08323999908235338
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,32,16384,0.025556445121765137
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,32,1536,0.004878222114510006
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,32,51200,1.3983217875162761
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,32,2560,0.07044800122578938
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,32,1024,0.0038480001191298165
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,32,2048,0.05649155378341675
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,32,768,0.003850666599141227
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,32,512,0.0034862222770849862
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,32,1536,0.04203022188610501
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,32,256,0.0031715554909573663
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,32,1024,0.03053599927160475
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,32,768,0.02552355494764116
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,32,128,0.0028524444335036804
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,32,65536,1.7878328959147136
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,32,64,0.0026391111314296722
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3841,32,32,0.002834666727317704
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,32,256,0.014849777022997538
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,32,128,0.012436444560686747
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,32,64,0.012055111428101858
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,32,32,0.011705777711338468
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,32,5120,0.14712533685896131
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,32,4096,0.114464004834493
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3841,32,512,0.020236444142129686
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,65536,12288,3.42319827609592
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,65536,16384,4.683806949191623
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,65536,12288,4.112059699164496
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,65536,16384,5.8575041029188375
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,65536,16384,5.383232964409722
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,65536,10240,3.2256444295247397
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,65536,10240,3.372357262505425
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,65536,12288,3.8650711907280813
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,65536,8192,2.584702173868815
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,65536,10240,3.2040479448106556
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,65536,8192,2.6105723910861545
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,65536,7168,2.206663131713867
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,65536,7168,2.23999998304579
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,65536,6144,1.9428880479600694
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,65536,8192,2.5919973585340714
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,65536,7168,2.310703913370768
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,65536,6144,1.9182302686903212
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,65536,5120,1.4837350845336914
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,65536,51200,14.816738552517362
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,65536,5120,1.6001030604044597
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,65536,6144,1.9563634660508897
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,65536,4096,1.2085119883219402
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,65536,3584,1.0034799575805664
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,65536,4096,1.2805902693006728
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,65536,5120,1.6256080203586156
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,65536,3584,1.133312013414171
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,65536,4096,1.2269911236233182
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,65536,3072,0.8953253428141276
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,65536,3072,0.9667796028984917
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,65536,3584,1.1285386615329318
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,65536,2560,0.7052213350931803
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,65536,3072,0.9704053666856555
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,65536,2048,0.605330679151747
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,65536,2560,0.894987530178494
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,65536,2048,0.6981671121385363
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,65536,2560,0.7978391117519803
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,65536,1536,0.4510969056023492
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,65536,1024,0.3111964331732856
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,65536,1536,0.7195244365268283
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,65536,1536,0.5097697575887045
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,65536,2048,0.6927439901563855
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,65536,768,0.26329512066311306
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,65536,1024,0.4174817668067084
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,65536,1024,0.49827109442816836
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,65536,512,0.18818844689263237
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,65536,768,0.3154097663031684
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,65536,256,0.14219289355807835
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,65536,768,0.32390043470594615
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,65536,512,0.2577608956231011
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,65536,512,0.3489866786532932
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,65536,128,0.10790489117304485
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,65536,256,0.19668977790408662
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,65536,256,0.24372267723083496
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,65536,64,0.12320178084903294
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,65536,128,0.1526915497250027
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,65536,32,0.08870844708548652
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,65536,64,0.22968978352016875
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,65536,32,0.22797687848409018
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,65536,128,0.2247342268625895
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,65536,51200,18.376805623372395
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,65536,51200,24.326799180772568
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,51200,16384,4.205330742730035
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,51200,16384,4.667177836100261
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,51200,51200,11.511494954427084
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,51200,12288,2.826865726047092
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,51200,16384,4.2686949835883246
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,51200,65536,14.912667168511284
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,51200,12288,3.310652414957682
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,51200,12288,3.132864846123589
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,51200,10240,2.497155507405599
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,51200,10240,2.669832017686632
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,51200,8192,1.948336919148763
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,51200,51200,18.51719495985243
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,51200,10240,2.588902155558268
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,51200,8192,2.1236809624565973
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,51200,51200,14.391545613606771
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,51200,7168,1.6777778201633031
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,51200,7168,1.849289788140191
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,51200,8192,2.092285368177626
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,51200,6144,1.4002248975965712
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,51200,7168,1.8133458031548395
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,51200,6144,1.5524720085991754
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,51200,5120,1.3116596009996202
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,51200,5120,1.3215795093112521
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,51200,4096,0.9889208475748698
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,51200,6144,1.5596977869669597
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,51200,5120,1.3319813410441081
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,51200,4096,1.0420506795247395
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,51200,3584,0.9149973127577039
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,51200,3584,0.901792844136556
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,51200,3072,0.6961217986212836
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,51200,3072,0.7664915720621744
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,51200,65536,24.368226793077255
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,51200,3584,0.898771603902181
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,51200,2560,0.5835413402981228
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,51200,2560,0.7296853595309787
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,51200,2048,0.5140764448377821
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,51200,3072,0.7501457532246908
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,51200,2560,0.6357413397894965
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,51200,2048,0.5564622349209255
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,51200,1536,0.34052356084187824
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,51200,4096,1.0231609344482422
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,51200,1024,0.23656890127393934
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,51200,768,0.1948711077372233
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,51200,2048,0.5346168941921657
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,51200,1536,0.4236151112450494
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,51200,1536,0.6428915659586588
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,51200,1024,0.3465369012620714
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,51200,512,0.14365688959757486
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,51200,768,0.2700044314066569
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,51200,256,0.10774044195810954
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,51200,65536,20.138431125217014
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,51200,512,0.2183368868298001
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,51200,128,0.08966400225957234
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,51200,512,0.31981155607435435
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,51200,256,0.19734133614434135
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,51200,256,0.1699146694607205
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,51200,64,0.07288444704479642
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,51200,128,0.1274062262641059
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,51200,32,0.07726933558781941
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,51200,128,0.2353395620981852
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,51200,64,0.17938221825493705
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,51200,32,0.1839991145663791
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,51200,1024,0.319452444712321
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,51200,768,0.28367378976609975
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,16384,16384,1.300353791978624
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,16384,16384,1.7404763963487413
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,16384,12288,0.8854657808939616
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,16384,51200,3.9940842522515188
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,16384,16384,1.7602062225341797
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,16384,65536,4.894893222384982
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,16384,10240,0.8037226465013293
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,16384,12288,1.2810960345798068
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,16384,8192,0.5239724583095974
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,16384,10240,1.068120002746582
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,16384,12288,1.2727360195583768
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,16384,7168,0.6196124288770888
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,16384,8192,0.8641066551208496
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,16384,10240,1.149279064602322
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,16384,51200,6.812676323784722
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,16384,8192,0.828188419342041
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,16384,51200,5.590157402886285
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,16384,6144,0.45255380206637913
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,16384,5120,0.3869022263420953
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,16384,6144,0.6308097839355469
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,16384,7168,0.735712899102105
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,16384,5120,0.6112177636888292
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,16384,6144,0.6727742089165581
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,16384,4096,0.2824088997311062
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,16384,4096,0.4148435592651367
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,16384,3584,0.2672204441494412
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,16384,65536,8.72292243109809
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,16384,3584,0.37872356838650173
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,16384,5120,0.7200080023871528
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,16384,3072,0.2146515581342909
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,16384,4096,0.434663110309177
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,16384,2560,0.18943022357092965
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,16384,3584,0.3798080020480686
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,16384,3072,0.3152444362640381
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,16384,65536,7.203413221571181
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,16384,7168,0.8951084348890516
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,16384,2560,0.2997235457102458
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,16384,2560,0.2790995438893636
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,16384,1536,0.11550311247507732
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,16384,1024,0.08153066370222303
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,16384,2048,0.21052800284491646
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,16384,1536,0.19299199846055773
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,16384,768,0.06544088655047946
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,16384,1536,0.16598578294118246
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,16384,1024,0.1397200028101603
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,16384,1024,0.1505191061231825
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,16384,512,0.044385777579413525
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,16384,256,0.03377244538731045
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,16384,768,0.11645600530836318
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,16384,512,0.10233689016766018
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,16384,512,0.08350577619340684
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,16384,128,0.03054844339688619
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,16384,256,0.07249599695205688
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,16384,256,0.07131022214889526
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,16384,64,0.02516711089346144
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,16384,128,0.06652177704705133
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,16384,32,0.02639377779430813
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,16384,64,0.0670293304655287
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,16384,2048,0.14872177441914877
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,16384,32,0.06730666425493029
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,16384,3072,0.3334328863355849
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,16384,2048,0.23511022991604277
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,16384,768,0.10332800282372369
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,16384,128,0.05790399842792087
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,12288,16384,0.7912746535407172
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,12288,51200,2.7110835181342234
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,12288,16384,1.4258267084757488
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,12288,65536,3.7535616556803384
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,12288,16384,1.4716044531928167
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,12288,12288,1.0261395772298176
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,12288,12288,0.6770488950941297
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,12288,10240,0.6170390976799859
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,12288,12288,1.0824862586127388
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,12288,8192,0.5328293376498753
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,12288,10240,0.8521404266357422
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,12288,51200,5.486929575602214
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,12288,7168,0.35124799940321183
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,12288,8192,0.6908808814154731
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,12288,10240,0.8897519641452365
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,12288,6144,0.36184355947706437
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,12288,51200,4.6746033562554254
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,12288,7168,0.631223095787896
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,12288,8192,0.7889866828918457
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,12288,6144,0.5069866710238987
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,12288,5120,0.2720595465766059
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,12288,7168,0.6438382466634115
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,12288,4096,0.20976355340745714
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,12288,65536,7.099090576171875
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,12288,5120,0.42042311032613117
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,12288,3584,0.17917154894934761
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,12288,6144,0.599765353732639
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,12288,5120,0.4668453534444173
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,12288,4096,0.3637591203053792
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,12288,3072,0.15489421950446233
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,12288,4096,0.3727848794725206
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,12288,65536,6.0386301676432295
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,12288,2560,0.13164267275068495
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,12288,3584,0.30582933955722386
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,12288,3584,0.3242853217654758
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,12288,3072,0.251397344801161
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,12288,2048,0.1122337712181939
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,12288,3072,0.2808328999413384
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,12288,1536,0.0924346645673116
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,12288,2560,0.221160888671875
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,12288,2560,0.23841423458523223
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,12288,2048,0.18547466066148546
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,12288,1024,0.06954044765896268
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,12288,2048,0.20219822724660239
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,12288,1536,0.13785778151618108
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,12288,768,0.052024000220828585
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,12288,512,0.03610488772392273
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,12288,1536,0.1751013331943088
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,12288,1024,0.10350222057766384
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,12288,256,0.026543110609054565
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,12288,1024,0.12337066067589654
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,12288,768,0.10027111238903469
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,12288,128,0.023706666297382776
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,12288,512,0.08115466435750325
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,12288,512,0.0684115555551317
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,12288,64,0.020048000746303134
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,12288,256,0.059711111916436084
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,12288,256,0.06255822049246894
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,12288,32,0.020100444555282593
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,12288,128,0.049703111251195274
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,12288,128,0.05425777700212267
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,12288,64,0.05363377928733826
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,12288,32,0.054373333851496376
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,10240,16384,0.8436942100524902
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,12288,768,0.08517244127061631
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,10240,16384,1.2440587149726021
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,10240,51200,2.6585814158121743
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,10240,16384,1.3234906726413302
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,10240,12288,0.6158764627244737
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,10240,65536,3.257523642645942
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,10240,10240,0.5025742318895128
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,10240,12288,0.9181653128729926
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,10240,12288,0.9728844960530599
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,10240,8192,0.3850408924950494
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,10240,10240,0.778165340423584
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,10240,7168,0.3477653397454156
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,10240,8192,0.5990257793002659
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,10240,51200,4.846552107069227
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,10240,10240,0.8402382002936469
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,10240,8192,0.6798764334784614
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,10240,6144,0.2834675576951769
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,10240,7168,0.585951116349962
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,10240,51200,4.2819396124945746
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,10240,5120,0.236699554655287
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,10240,7168,0.5788159900241429
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,10240,4096,0.21988177299499512
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,10240,5120,0.3795342180464003
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,10240,3584,0.14895555708143446
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,10240,4096,0.29385243521796334
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,10240,5120,0.42990843454996747
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,10240,65536,6.136631859673394
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,10240,3072,0.1383297840754191
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,10240,4096,0.45717334747314453
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,10240,3584,0.29935910966661244
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,10240,65536,5.437653435601129
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,10240,2560,0.125873777601454
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,10240,6144,0.44688087039523655
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,10240,3072,0.2661084334055583
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,10240,2048,0.10418133603201972
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,10240,2560,0.19799199369218615
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,10240,6144,0.5024986796908909
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,10240,1536,0.07789599895477295
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,10240,2048,0.1574675507015652
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,10240,1024,0.05979733334647285
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,10240,2048,0.18280177646213105
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,10240,1536,0.14924711651272243
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,10240,1536,0.12173510922325982
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,10240,768,0.042393777105543345
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,10240,1024,0.11065600315729777
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,10240,1024,0.09218311309814453
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,10240,512,0.03080000148879157
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,10240,768,0.07410044140285917
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,10240,768,0.09393599960539077
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,10240,3584,0.254984007941352
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,10240,256,0.02308622168170081
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,10240,512,0.060757332377963595
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,10240,512,0.07458400064044528
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,10240,128,0.020978666014141504
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,10240,64,0.01882222294807434
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,10240,256,0.057429333527882896
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,10240,256,0.05091555582152473
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,10240,128,0.046184000041749745
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,10240,3072,0.24548000759548613
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,10240,128,0.04698666599061754
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,10240,64,0.046959112087885536
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,10240,32,0.04645955562591553
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,10240,2560,0.2195368872748481
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,10240,32,0.01963200006220076
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,8192,16384,0.6544062296549479
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,8192,51200,2.2236898210313583
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,8192,16384,1.0720453262329102
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,8192,65536,2.6857982211642795
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,8192,12288,0.5462906625535753
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,8192,16384,1.1791288587782118
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,8192,10240,0.4116560088263617
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,8192,10240,0.6583022011650933
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,8192,12288,0.8857679896884494
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,8192,8192,0.32138578097025555
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,8192,51200,4.084404415554471
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,8192,8192,0.5218897925482856
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,8192,10240,0.8281653192308215
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,8192,12288,0.7901440196567111
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,8192,7168,0.2799431218041314
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,8192,51200,3.7245992024739585
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,8192,6144,0.22651643223232695
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,8192,8192,0.6210026741027832
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,8192,7168,0.45604175991482204
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,8192,5120,0.18722755379147002
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,8192,65536,5.089937845865886
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,8192,7168,0.5218533409966363
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,8192,6144,0.4864640235900879
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,8192,4096,0.14571111732059056
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,8192,5120,0.33203289243910045
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,8192,3584,0.13441156016455755
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,8192,5120,0.37861333953009707
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,8192,4096,0.27762044800652397
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,8192,3072,0.11172444290584987
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,8192,4096,0.30274489190843373
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,8192,3584,0.2413110997941759
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,8192,2560,0.09595911370383368
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,8192,3584,0.2667377789815267
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,8192,2048,0.08122044139438205
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,8192,3072,0.19298222329881456
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,8192,3072,0.23867911762661406
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,8192,2560,0.16455199983384874
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,8192,1536,0.06353422005971272
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,8192,2560,0.20407022370232475
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,8192,1024,0.04438222116894192
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,8192,2048,0.136062224706014
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,8192,2048,0.17746222019195557
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,8192,768,0.034317334493001304
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,8192,1536,0.1313813394970364
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,8192,1024,0.0991555584801568
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,8192,1024,0.08157244655821058
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,8192,512,0.025103110406133864
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,8192,256,0.01947022146648831
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,8192,768,0.08354222112231785
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,8192,512,0.06785955693986681
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,8192,512,0.05319111214743721
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,8192,128,0.01699466672208574
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,8192,256,0.042098667886522084
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,8192,256,0.051876445611317955
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,8192,64,0.015977778368526034
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,8192,32,0.016327111257447135
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,8192,128,0.03867644402715895
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,8192,128,0.041435556279288396
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,8192,6144,0.4640666643778483
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,8192,64,0.03810133205519782
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,8192,32,0.03794755538304647
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,8192,65536,4.766833835177951
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,8192,1536,0.10788177781634861
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,8192,768,0.0673804415596856
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,7168,16384,0.5092479917738173
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,7168,51200,1.8793413374159071
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,7168,65536,2.2547147538926864
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,7168,12288,0.4662586847941081
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,7168,16384,1.0322080188327365
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,7168,10240,0.3317191070980496
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,7168,16384,1.1220009062025282
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,7168,12288,0.7594435479905871
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,7168,8192,0.2798115677303738
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,7168,12288,0.8989404042561849
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,7168,10240,0.667334238688151
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,7168,10240,0.7028320100572375
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,7168,7168,0.23368710941738555
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,7168,8192,0.5788826412624782
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,7168,51200,3.782600826687283
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,7168,6144,0.19987289110819498
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,7168,8192,0.5681386523776585
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,7168,6144,0.37873156865437824
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,7168,7168,0.5425644450717503
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,7168,65536,4.681751251220703
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,7168,6144,0.4419902165730794
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,7168,51200,3.5076043870713978
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,7168,5120,0.3081555631425646
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,7168,3584,0.1158248848385281
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,7168,5120,0.37117422951592344
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,7168,4096,0.23857421345180937
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,7168,3072,0.09727999899122451
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,7168,4096,0.29132265514797634
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,7168,65536,4.526322682698567
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,7168,3584,0.20806754959954155
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,7168,3584,0.25525156656901044
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,7168,3072,0.17989510960049102
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,7168,3072,0.22141599655151367
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,7168,2560,0.1531368891398112
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,7168,2048,0.06623644298977323
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,7168,2560,0.18905956215328643
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,7168,1536,0.055148445897632174
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,7168,5120,0.17972444163428414
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,7168,2048,0.12645422087775335
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,7168,2048,0.1563768916659885
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,7168,1024,0.03787644373046027
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,7168,1536,0.09934400187598334
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,7168,4096,0.12821422682868108
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,7168,1024,0.0951404439078437
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,7168,1024,0.07512178023656209
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,7168,512,0.021746666895018682
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,7168,768,0.06016266345977783
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,7168,768,0.07987733019722833
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,7168,256,0.016899555921554565
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,7168,512,0.04857422245873345
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,7168,512,0.0645457771089342
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,7168,128,0.01516533394654592
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,7168,256,0.03814933366245694
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,7168,256,0.04958044489224752
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,7168,64,0.01277511070171992
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,7168,32,0.013064888616402945
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,7168,128,0.04000711109903123
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,7168,128,0.034324444002575345
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,7168,64,0.03399644295374552
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,7168,2560,0.08833155367109512
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,7168,32,0.03370133373472426
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,7168,7168,0.4271217717064752
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,7168,1536,0.1255440049701267
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,6144,16384,0.47927199469672305
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,6144,51200,1.6938728756374781
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,7168,768,0.028710222906536523
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,6144,16384,0.9206008911132812
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,6144,12288,0.38311465581258136
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,6144,12288,0.6682986683315701
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,6144,16384,1.0658790800306532
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,6144,65536,1.9895119137234156
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,6144,10240,0.2840382258097331
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,6144,12288,0.8055502043830024
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,6144,8192,0.23459198739793566
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,6144,10240,0.5619849099053277
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,6144,8192,0.44747469160291886
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,6144,7168,0.20043555895487467
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,6144,10240,0.6570035616556803
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,6144,51200,3.254357231987847
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,6144,6144,0.18284889062245688
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,6144,8192,0.5849226845635308
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,6144,65536,4.312975141737196
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,6144,7168,0.39165332582261825
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,6144,5120,0.14910666147867838
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,6144,6144,0.33879023128085667
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,6144,7168,0.4890631039937337
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,6144,4096,0.12069777647654216
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,6144,5120,0.30523289574517143
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,6144,51200,3.328203625149197
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,6144,3584,0.10074222087860107
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,6144,6144,0.40639734268188477
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,6144,5120,0.3415857685936822
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,6144,4096,0.22063199679056802
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,6144,3072,0.0828897754351298
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,6144,65536,4.14029057820638
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,6144,2560,0.07732622490988837
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,6144,4096,0.2738453282250298
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,6144,3584,0.19585243860880533
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,6144,3072,0.16427111625671387
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,6144,3584,0.23802312215169272
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,6144,2048,0.06497333447138469
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,6144,3072,0.20681599775950113
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,6144,2560,0.15217599603864881
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,6144,1536,0.04791999856630961
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,6144,2560,0.17664978239271376
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,6144,1024,0.03143111202451918
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,6144,2048,0.11956532796223958
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,6144,768,0.025063999825053748
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,6144,2048,0.14743555916680232
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,6144,1536,0.11809689468807644
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,6144,1536,0.09256266885333592
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,6144,512,0.018681777848137748
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,6144,1024,0.08948622147242229
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,6144,256,0.01441511180665758
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,6144,768,0.08058666520648532
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,6144,768,0.05567555295096504
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,6144,128,0.012732444538010491
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,6144,512,0.043354666895336576
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,6144,256,0.04680000080002678
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,6144,64,0.011043555206722684
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,6144,256,0.034246222840415105
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,6144,32,0.01108888867828581
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,6144,128,0.0366960002316369
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,6144,128,0.03084355592727661
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,6144,64,0.030834668212466772
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,6144,32,0.03013777732849121
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,6144,1024,0.06867644521925184
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,6144,512,0.059975114133622914
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,5120,51200,1.3701697455512152
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,5120,16384,0.40966044531928164
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,5120,65536,1.7832923465304906
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,5120,12288,0.3070853286319309
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,5120,16384,0.8278995619879829
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,5120,10240,0.25633690092298717
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,5120,12288,0.6843040254380969
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,5120,12288,0.7895991007486979
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,5120,10240,0.5386995739407009
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,5120,8192,0.20742311742570665
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,5120,51200,2.87189949883355
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,5120,10240,0.6363209088643392
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,5120,7168,0.18157866266038683
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,5120,8192,0.4152008957333035
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,5120,6144,0.1524488925933838
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,5120,8192,0.5146133104960123
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,5120,65536,3.6705440945095487
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,5120,7168,0.3597742186652289
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,5120,7168,0.45395554436577695
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,5120,5120,0.1266604397031996
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,5120,4096,0.10405333174599542
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,5120,6144,0.31898310449388295
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,5120,16384,1.0128675036960177
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,5120,5120,0.2570364475250244
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,5120,6144,0.38860177993774414
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,5120,3584,0.09401600228415595
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,5120,5120,0.32728621694776744
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,5120,3072,0.07515377468532987
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,5120,4096,0.20549244350857207
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,5120,51200,3.09700436062283
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,5120,4096,0.26181689898173016
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,5120,2560,0.062160889307657875
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,5120,3584,0.22802223099602592
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,5120,2048,0.054027554061677724
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,5120,65536,3.974389394124349
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,5120,3072,0.15050666862063938
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,5120,3072,0.19811556074354383
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,5120,1536,0.038872000243928694
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,5120,2560,0.1282364394929674
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,5120,2560,0.16916799545288086
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,5120,1024,0.026932444837358262
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,5120,2048,0.1405093272527059
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,5120,768,0.02163911031352149
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,5120,2048,0.10650755299462213
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,5120,512,0.01719111038578881
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,5120,1024,0.06246755520502726
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,5120,768,0.07163555754555596
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,5120,768,0.05004533463054233
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,5120,256,0.01400888959566752
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,5120,512,0.03927822245491876
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,5120,512,0.057486222849951855
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,5120,128,0.01180622229973475
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,5120,256,0.03070844544304742
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,5120,64,0.012785777449607849
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,5120,128,0.033583111233181424
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,5120,32,0.013168888787428537
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,5120,64,0.027746667464574177
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,5120,32,0.02718222141265869
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,5120,3584,0.1745955546696981
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,5120,1536,0.08416089084413315
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,5120,1024,0.08497422271304661
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,5120,256,0.04361866580115425
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,5120,128,0.02814133299721612
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,4096,65536,1.3569751315646703
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,4096,16384,0.34644267294141984
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,4096,51200,1.0996239980061848
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,5120,1536,0.11293866899278428
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,4096,12288,0.2889084551069471
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,4096,16384,0.7678506639268664
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,4096,12288,0.5565146870083278
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,4096,16384,0.9363715913560656
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,4096,10240,0.2133315536710951
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,4096,12288,0.697898652818468
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,4096,10240,0.46698665618896484
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,4096,8192,0.18088089095221627
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,4096,51200,2.589459525214301
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,4096,65536,3.2881974114312063
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,4096,7168,0.14708533551957872
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,4096,10240,0.6087013350592719
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,4096,8192,0.3751777807871501
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,4096,6144,0.13313778241475424
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,4096,8192,0.47684446970621747
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,4096,7168,0.3322293228573269
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,4096,5120,0.11036177476247151
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,4096,7168,0.41786400477091473
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,4096,4096,0.08840888738632202
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,4096,6144,0.3646266725328233
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,4096,51200,2.8569920857747397
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,4096,5120,0.23670487933688691
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,4096,65536,3.640816158718533
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,4096,3584,0.07896444532606336
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,4096,5120,0.30312977896796334
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,4096,3072,0.06917688581678602
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,4096,4096,0.18492444356282553
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,4096,3584,0.15936888588799372
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,4096,2560,0.053456889258490674
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,4096,3584,0.21134844091203478
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,4096,3072,0.13631021976470947
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,4096,2048,0.045336888896094434
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,4096,3072,0.18280977673000762
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,4096,2560,0.11532444424099392
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,4096,1536,0.0370506677362654
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,4096,2560,0.156713777118259
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,4096,1024,0.026368000441127356
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,4096,2048,0.0951039989789327
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,4096,2048,0.13025244077046713
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,4096,768,0.018945778409639995
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,4096,1536,0.10453333457310994
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,4096,1536,0.07609511084026761
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,4096,512,0.01663822266790602
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,4096,1024,0.07882577843136258
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,4096,768,0.04467466804716322
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,4096,768,0.06640977991951837
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,4096,6144,0.283644437789917
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,4096,256,0.012703110774358114
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,4096,512,0.034837332036760114
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,4096,512,0.05268355541759067
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,4096,128,0.009338666995366415
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,4096,64,0.00832266691658232
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,4096,256,0.04008888867166307
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,4096,256,0.02721066607369317
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,4096,128,0.0328800015979343
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,4096,128,0.025047999289300706
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,4096,64,0.024719999896155462
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,4096,32,0.02416177756256527
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,4096,4096,0.24154400825500488
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,4096,1024,0.05533866749869453
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,3584,65536,1.0328559875488281
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,3584,51200,0.9077964358859592
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,3584,16384,0.2911289003160265
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,4096,32,0.008285333712895712
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,3584,12288,0.20495911439259848
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,3584,12288,0.5264879862467448
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,3584,16384,0.7851422097947863
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,3584,10240,0.17079199684990776
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,3584,16384,0.9100515577528211
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,3584,12288,0.7071697976854113
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,3584,10240,0.4425048828125
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,3584,8192,0.14986666043599448
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,3584,51200,2.333422131008572
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,3584,7168,0.12707822852664524
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,3584,8192,0.35787200927734375
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,3584,10240,0.5825191073947483
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,3584,6144,0.10502666897243923
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,3584,7168,0.3126764562394884
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,3584,8192,0.45506042904324
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,3584,65536,3.0103734334309897
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,3584,5120,0.08955466747283936
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,3584,7168,0.4183431201510959
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,3584,6144,0.2708622349633111
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,3584,4096,0.06751555866665311
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,3584,51200,2.7282223171657987
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,3584,6144,0.3477733400132921
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,3584,5120,0.22308267487419975
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,3584,3072,0.04629955689112345
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,3584,4096,0.17605866326226127
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,3584,5120,0.2909031179216173
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,3584,4096,0.23202488157484266
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,3584,2560,0.04451555675930447
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,3584,3584,0.15144177277882895
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,3584,3584,0.20297777652740479
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,3584,2048,0.0329075555006663
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,3584,3072,0.12981866465674505
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,3584,3072,0.1756524509853787
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,3584,2560,0.11026310920715332
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,3584,2560,0.1500951051712036
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,3584,1024,0.020294222566816542
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,3584,2048,0.09035999907387628
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,3584,2048,0.1250213384628296
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,3584,1536,0.07247022125456068
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,3584,65536,3.4865165286593967
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,3584,1536,0.10092000166575114
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,3584,768,0.016044444508022733
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,3584,1024,0.05248444279034933
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,3584,512,0.012480888929631976
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,3584,1024,0.07626044750213623
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,3584,256,0.009694221946928237
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,3584,768,0.06413955820931329
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,3584,768,0.041045334604051374
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,3584,512,0.05006400081846449
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,3584,128,0.008667555948098501
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,3584,512,0.0329715543323093
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,3584,64,0.008039111064540016
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,3584,256,0.04189599884880913
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,3584,256,0.025478222303920325
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,3584,32,0.008006222546100616
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,3584,128,0.03223111232121786
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,3584,128,0.023590222001075745
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,3584,64,0.022652443912294176
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,3584,32,0.022636445032225713
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,3584,1536,0.02896266513400608
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,3072,51200,0.7397217750549316
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,3072,65536,1.0282586415608723
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,3072,16384,0.2649466726515028
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,3584,3584,0.058435552650027804
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,3072,12288,0.19314844078487822
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,3072,16384,0.7103048960367838
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,3072,12288,0.49721066157023114
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,3072,16384,0.8691786660088433
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,3072,51200,2.161937713623047
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,3072,10240,0.16249956025017634
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,3072,8192,0.13651288880242243
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,3072,12288,0.6528755293952094
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,3072,10240,0.42098222838507754
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,3072,8192,0.33717955483330625
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,3072,65536,2.7806426154242625
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,3072,10240,0.5390986866421169
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,3072,6144,0.09534311294555664
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,3072,8192,0.43630043665568036
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,3072,7168,0.29679732852511936
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,3072,5120,0.08267555634180705
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,3072,7168,0.38429689407348633
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,3072,6144,0.2555430995093452
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,3072,6144,0.33245955573187935
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,3072,4096,0.06776266627841525
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,3072,51200,2.6013946533203125
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,3072,5120,0.21260889371236166
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,3072,3584,0.05665600299835205
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,3072,5120,0.2786960071987576
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,3072,3072,0.04837422238455879
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,3072,4096,0.1665804386138916
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,3072,65536,3.3296142154269748
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,3072,2560,0.04075466593106588
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,3072,4096,0.2213697830835978
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,3072,3584,0.14432444837358263
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,3072,3584,0.19396089182959664
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,3072,2048,0.03564622335963779
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,3072,3072,0.12372177177005345
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,3072,1536,0.023178666830062866
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,3072,2560,0.1435733371310764
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,3072,2560,0.10428088903427124
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,3072,7168,0.11853867106967503
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,3072,2048,0.08596533536911011
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,3072,1536,0.09576088852352566
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,3072,1536,0.06561777989069621
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,3072,1024,0.07324000199635823
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,3072,512,0.011725333001878528
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,3072,768,0.03958400090535482
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,3072,512,0.031114667654037476
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,3072,512,0.04821244544453091
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,3072,256,0.009104889300134447
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,3072,256,0.03861600160598755
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,3072,128,0.007609777980380588
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,3072,128,0.021713778376579285
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,3072,3072,0.16833599408467612
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,3072,128,0.031161778502994116
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,3072,64,0.007249777515729268
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,3072,32,0.00738844441043006
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,3072,2048,0.1197119951248169
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,3072,64,0.02093066606256697
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,3072,32,0.021274665991465252
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,3072,1024,0.04910755488607618
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,3072,768,0.06169688701629639
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,3072,256,0.023761777414215937
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,2560,65536,0.852319982316759
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,2560,51200,0.6799253357781304
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,2560,16384,0.25049956639607746
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,3072,1024,0.017303999927308824
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,3072,768,0.014630221658282809
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,2560,12288,0.1595404413011339
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,2560,16384,0.6930195490519205
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,2560,10240,0.13431733184390598
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,2560,12288,0.47052801979912656
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,2560,12288,0.6374390920003256
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,2560,16384,0.8986657460530599
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,2560,51200,2.014613257514106
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,2560,10240,0.40273332595825195
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,2560,8192,0.10807644658618504
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,2560,7168,0.09676977660920884
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,2560,10240,0.535229312049018
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,2560,8192,0.3209351168738471
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,2560,65536,2.584857728746202
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,2560,6144,0.07550577984915839
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,2560,8192,0.43351022402445477
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,2560,5120,0.0689493351512485
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,2560,7168,0.3814551035563151
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,2560,6144,0.24154223336113823
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,2560,4096,0.0495306650797526
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,2560,6144,0.3304275671641032
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,2560,5120,0.2013111114501953
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,2560,3584,0.04361688759591845
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,2560,5120,0.27709688080681694
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,2560,4096,0.15784266259935167
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,2560,3072,0.03603200117746989
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,2560,51200,2.586226569281684
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,2560,4096,0.21928532918294272
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,2560,2560,0.03334844443533156
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,2560,3584,0.13670399453904894
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,2560,3584,0.1930088864432441
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,2560,65536,3.312351014879015
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,2560,2048,0.028360890017615423
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,2560,3072,0.11741956075032552
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,2560,3072,0.16700266467200386
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,2560,1536,0.021528000632921856
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,2560,2560,0.09856266445583767
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,2560,2560,0.14283822642432317
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,2560,1024,0.015505777464972602
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,2560,2048,0.08034933275646634
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,2560,2048,0.11827199988894993
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,2560,768,0.012440889245933957
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,2560,1536,0.06139289008246528
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,2560,1536,0.09473333093855117
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,2560,512,0.010334221853150262
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,2560,7168,0.2821733421749539
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,2560,1024,0.07197688685523139
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,2560,256,0.00795999997191959
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,2560,128,0.007276444799370236
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,2560,768,0.060025778081681996
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,2560,512,0.046781334612104625
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,2560,512,0.028561777538723413
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,2560,256,0.03685333331425985
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,2560,64,0.006577777779764599
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,2560,256,0.022665777140193518
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,2560,32,0.006624889042642381
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,2560,128,0.029106666644414265
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,2560,128,0.020237333244747586
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,2560,64,0.019555555449591745
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,2560,32,0.019558222757445443
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,2048,51200,0.5169884363810221
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,2048,65536,0.6555164655049642
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,2048,16384,0.18688978089226616
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,2560,1024,0.045828445090187915
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,2560,768,0.03701333204905192
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,2048,12288,0.12402489450242783
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,2048,16384,0.6443164613511827
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,2048,10240,0.10603555705812241
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,2048,12288,0.44319465425279403
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,2048,16384,0.852693345811632
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,2048,12288,0.6112177636888292
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,2048,8192,0.09162400166193645
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,2048,10240,0.37402044402228457
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,2048,51200,1.8592294057210286
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,2048,7168,0.07467289103402032
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,2048,10240,0.5125964482625326
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,2048,8192,0.30133154657151967
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,2048,6144,0.07150133450826009
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,2048,7168,0.26524445745680064
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,2048,65536,2.368481742011176
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,2048,8192,0.4190479914347331
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,2048,5120,0.05241866575347053
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,2048,4096,0.04265066650178698
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,2048,7168,0.3657253318362766
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,2048,6144,0.22798222965664336
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,2048,3584,0.03784711162249247
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,2048,5120,0.18927644358740914
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,2048,6144,0.3167822096082899
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,2048,51200,2.474940405951606
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,2048,5120,0.26445778210957843
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,2048,3072,0.03408799899948968
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,2048,4096,0.20978755421108672
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,2048,2560,0.029157333903842505
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,2048,3584,0.12807555993398032
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,2048,3584,0.18410844273037383
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,2048,2048,0.024478221933046978
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,2048,3072,0.10991822348700629
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,2048,3072,0.15944266319274902
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,2048,1536,0.019718221492237516
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,2048,2560,0.1371413336859809
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,2048,1024,0.015180443723996481
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,2048,2048,0.07506577836142646
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,2048,1536,0.05720444520314535
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,2048,1536,0.09114578035142686
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,2048,65536,3.157853232489692
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,2048,768,0.011745777395036487
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,2048,1024,0.04109244545300802
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,2048,1024,0.06787644492255317
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,2048,768,0.03508266806602478
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,2048,768,0.05645155244403415
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,2048,512,0.026740445031060114
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,2048,256,0.007258666886223688
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,2048,256,0.03559733430544535
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,2048,256,0.021176000436147053
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,2048,128,0.0069573331210348345
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,2048,128,0.018922666708628338
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,2048,128,0.028780443800820246
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,2048,4096,0.14802311526404485
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,2048,32,0.006233777850866318
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,2048,64,0.018188445104493033
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,2048,32,0.017878222796652053
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,2048,2560,0.09222933318879868
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,2048,2048,0.11396711402469212
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,2048,512,0.009365333451165093
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,1536,65536,0.5021226671006944
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,2048,512,0.045200887653562755
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,1536,51200,0.3785884380340576
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,1536,16384,0.12139733632405598
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,2048,64,0.007260444263617198
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,1536,12288,0.09587466716766357
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,1536,16384,0.5654595692952474
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,1536,16384,0.7686497900221082
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,1536,12288,0.4170728789435492
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,1536,10240,0.08487466971079509
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,1536,12288,0.5866364373101128
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,1536,8192,0.06439199712541369
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,1536,10240,0.3497955534193251
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,1536,51200,1.7214426464504664
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,1536,7168,0.05584355857637194
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,1536,65536,2.1928738488091364
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,1536,10240,0.48921600977579754
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,1536,8192,0.2834800084431966
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,1536,6144,0.047136889563666455
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,1536,5120,0.041061331828435264
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,1536,7168,0.24926487604777017
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,1536,6144,0.21453689204321968
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,1536,7168,0.34862221611870664
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,1536,6144,0.3022720019022624
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,1536,5120,0.17767732673221162
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,1536,3584,0.026698667142126296
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,1536,5120,0.25225332048204213
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,1536,4096,0.13897511694166395
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,1536,51200,2.353758282131619
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,1536,4096,0.19952444235483804
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,1536,3072,0.02476799984773
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,1536,2560,0.020695999264717102
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,1536,3584,0.1755208836661445
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,1536,65536,3.0001519521077475
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,1536,3072,0.10304711262385051
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,1536,3072,0.15198577774895564
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,1536,2048,0.017080000705189176
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,1536,2560,0.08643200000127156
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,1536,1536,0.013632888595263163
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,1536,2560,0.1307351059383816
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,1536,1024,0.010226666927337646
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,1536,2048,0.07221421930525038
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,1536,1536,0.05556888712777031
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,1536,1536,0.0869342221154107
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,1536,768,0.00867555538813273
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,1536,1024,0.03804088963402642
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,1536,1024,0.06402133570777045
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,1536,8192,0.39593866136338973
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,1536,768,0.054049776660071484
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,1536,256,0.005912888795137405
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,1536,512,0.025461332665549383
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,1536,512,0.04314400090111626
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,1536,4096,0.03085422184732225
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,1536,128,0.0052533331844541765
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,1536,256,0.019561777512232464
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,1536,256,0.034239110019471906
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,1536,64,0.004876444323195351
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,1536,128,0.027445332871543035
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,1536,128,0.01722666621208191
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,1536,32,0.004914666629499859
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,1536,64,0.016746666696336534
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,1536,32,0.016537777251667447
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,1536,3584,0.12044978141784668
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,1024,65536,0.34563732147216797
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,1024,51200,0.2857902314927843
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,1536,2048,0.10879022545284694
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,1024,16384,0.0967644453048706
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,1536,512,0.006979555719428592
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,1536,768,0.031939556201299034
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,1024,12288,0.06589955753750272
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,1024,16384,0.5193191104465061
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,1024,10240,0.058824890189700656
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,1024,12288,0.39187555842929417
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,1024,16384,0.7484764522976346
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,1024,12288,0.5548639827304417
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,1024,10240,0.33002487818400067
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,1024,51200,1.5990542305840387
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,1024,8192,0.26619111167060006
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,1024,10240,0.4648444387647841
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,1024,7168,0.03926488757133484
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,1024,6144,0.03540800015131632
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,1024,65536,2.0404514736599393
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,1024,8192,0.3768311076694065
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,1024,7168,0.23377956284417045
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,1024,5120,0.029672000143263075
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,1024,6144,0.20182577768961588
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,1024,7168,0.33199644088745117
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,1024,4096,0.02459022237194909
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,1024,6144,0.28739645746019155
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,1024,5120,0.16758844587537977
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,1024,5120,0.24008001221550834
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,1024,3584,0.022058667408095464
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,1024,4096,0.1310302284028795
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,1024,51200,2.2340195973714194
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,1024,3072,0.01941244469748603
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,1024,8192,0.04706666535801358
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,1024,2560,0.01676177812947167
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,1024,3584,0.11311199929979111
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,1024,3584,0.16751555601755777
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,1024,2048,0.014392000105645923
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,1024,3072,0.09597155782911514
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,1024,3072,0.14458844396803114
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,1024,65536,2.8544765048556857
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,1024,2560,0.08086044258541532
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,1024,2560,0.12348711490631104
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,1024,1024,0.00964355551534229
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,1024,2048,0.06698133548100789
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,1024,2048,0.10354222191704644
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,1024,768,0.008614222208658854
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,1024,1536,0.08260266648398505
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,1024,1536,0.050966223080952965
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,1024,512,0.0069226668112807805
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,1024,1024,0.035767998960283064
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,1024,1024,0.06037066380182902
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,1024,256,0.005599110904667113
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,1024,768,0.029489778810077246
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,1024,512,0.04107022285461426
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,1024,128,0.005230222311284807
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,1024,256,0.03223199976815118
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,1024,128,0.01578044394652049
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,1024,128,0.026366222235891554
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,1024,64,0.00453244439429707
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,1024,32,0.004864000197913912
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,1024,4096,0.19008178181118437
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,1024,64,0.015209777487648858
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,1024,32,0.01478666729397244
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,768,65536,0.25750578774346244
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,1024,1536,0.012069332930776807
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,768,51200,0.205932444996304
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,768,16384,0.0628346668349372
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,1024,512,0.023959111836221483
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,1024,256,0.017663111289342243
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,768,12288,0.048751999934514366
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,768,16384,0.4988000128004286
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,768,12288,0.3775555557674832
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,768,10240,0.04154488775465224
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,768,16384,0.729672008090549
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,768,51200,1.5371715757581923
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,768,12288,0.5527937677171495
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,768,10240,0.316793786154853
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,1024,768,0.05135111014048258
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,768,8192,0.03407466742727492
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,768,65536,1.9637902577718098
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,768,7168,0.029994666576385498
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,768,6144,0.025314667158656653
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,768,10240,0.46445597542656797
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,768,8192,0.2559457884894477
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,768,7168,0.22511466344197592
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,768,5120,0.02053777707947625
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,768,6144,0.1937342219882541
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,768,8192,0.37584887610541445
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,768,7168,0.3306159973144531
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,768,4096,0.017129777206314933
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,768,3584,0.015159999330838522
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,768,6144,0.28677333725823295
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,768,5120,0.1606231133143107
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,768,5120,0.2395519945356581
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,768,4096,0.1260639958911472
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,768,4096,0.18948533799913195
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,768,3584,0.10766666465335423
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,768,3584,0.16695288817087808
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,768,2560,0.012433778080675336
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,768,2048,0.010038221875826517
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,768,51200,2.223896026611328
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,768,3072,0.14408444033728704
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,768,1536,0.008929777476522658
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,768,65536,2.843176947699653
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,768,2560,0.07717688878377278
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,768,2560,0.1234640015496148
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,768,1024,0.0069848886794514125
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,768,2048,0.06333511405520968
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,768,2048,0.10201155477099949
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,768,1536,0.047835555341508657
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,768,1536,0.08239110973146227
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,768,1024,0.03417422374089559
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,768,1024,0.060461335712009005
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,768,512,0.005201777650250329
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,768,256,0.004464888738261329
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,768,768,0.02844888965288798
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,768,768,0.050739556550979614
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,768,128,0.0041742221348815495
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,768,512,0.041109333435694374
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,768,512,0.022801778382725183
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,768,256,0.01720888912677765
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,768,256,0.032347556617524885
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,768,32,0.0038355555799272326
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,768,128,0.02604088849491543
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,768,128,0.014893333117167154
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,768,64,0.014492443866199918
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,768,32,0.014165333575672574
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,512,65536,0.1962613397174411
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,768,3072,0.013794666363133324
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,512,51200,0.16158844365013972
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,768,3072,0.09201511409547593
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,512,16384,0.05184177888764275
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,768,768,0.006215999937719769
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,768,64,0.003855111284388436
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,512,16384,0.48671823077731663
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,512,12288,0.03881866733233134
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,512,16384,0.6919591161939832
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,512,10240,0.033033778270085655
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,512,12288,0.36841511726379395
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,512,12288,0.525268448723687
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,512,51200,1.4919644461737738
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,512,8192,0.0255395554833942
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,512,10240,0.3089280128479004
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,512,65536,1.906338585747613
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,512,7168,0.02176977859603034
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,512,10240,0.4398870997958713
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,512,8192,0.24964978959825304
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,512,6144,0.01962844365172916
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,512,8192,0.3573102156321208
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,512,7168,0.21940355830722383
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,512,5120,0.016543111867374845
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,512,7168,0.3145475652482775
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,512,6144,0.18927644358740914
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,512,4096,0.013750221994188098
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,512,51200,2.118704054090712
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,512,6144,0.27233510547214085
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,512,5120,0.1569111082288954
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,512,5120,0.22849067052205405
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,512,3072,0.011657777759763928
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,512,4096,0.12248533301883274
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,512,4096,0.18005777729882133
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,512,2560,0.010050666828950247
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,512,65536,2.6959590911865234
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,512,3584,0.15824800067477757
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,512,2048,0.008961777720186446
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,512,3072,0.08996799919340347
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,512,3072,0.1373280021879408
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,512,1536,0.007619555625650618
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,512,2560,0.07514578104019165
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,512,2560,0.11714400185479058
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,512,1024,0.006231110956933763
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,512,2048,0.09739822149276733
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,512,2048,0.061647110515170626
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,512,1536,0.07756977611117892
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,512,1536,0.04615911179118686
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,512,512,0.004912888838185204
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,512,1024,0.03316888875431485
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,512,1024,0.05742310815387302
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,512,256,0.0041848888827694785
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,512,768,0.027608889672491286
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,512,768,0.04876888791720072
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,512,128,0.00424177779091729
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,512,256,0.030942221482594807
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,512,128,0.014191110928853353
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,512,64,0.0041742221348815495
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,512,128,0.02462933295302921
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,512,32,0.004242666479614046
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,512,3584,0.012487110992272695
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,512,32,0.01352355546421475
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,256,65536,0.1181902223163181
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,512,3584,0.10515999794006348
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,256,51200,0.09242310788896348
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,512,768,0.005550222264395819
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,512,512,0.03934489025010003
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,512,256,0.016523554921150208
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,256,16384,0.0373342235883077
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,512,64,0.013471110827393003
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,256,12288,0.027688889039887324
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,256,16384,0.4676622284783258
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,256,16384,0.6863155364990234
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,256,10240,0.021190222766664293
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,256,12288,0.3538044558631049
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,256,51200,1.4325244691636827
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,256,8192,0.01749955614407857
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,256,65536,1.8277626037597656
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,256,12288,0.5213724242316352
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,512,512,0.02196088929971059
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,256,7168,0.01533600025706821
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,256,8192,0.23979110187954375
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,256,10240,0.43828267521328396
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,256,6144,0.013506666653686099
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,256,7168,0.2106728951136271
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,256,8192,0.3540693389044867
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,256,5120,0.011970666547616323
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,256,7168,0.3125564522213406
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,256,6144,0.18138933181762695
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,256,4096,0.010328888893127441
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,256,6144,0.2703893449571398
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,256,5120,0.15051733122931585
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,256,51200,2.097135967678494
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,256,3584,0.009700444837411245
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,256,3072,0.008357333640257517
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,256,5120,0.22650310728285047
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,256,4096,0.11763021681043838
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,256,65536,2.678693347507053
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,256,2560,0.007670222057236566
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,256,3584,0.10028888781865437
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,256,3584,0.15695644749535456
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,256,3072,0.0853031078974406
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,256,2048,0.006697777658700943
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,256,3072,0.13558222187889948
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,256,1536,0.006238222122192383
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,256,2560,0.0718053314420912
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,256,2560,0.11622222264607747
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,256,2048,0.058303111129336886
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,256,2048,0.09621244668960571
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,256,1024,0.00490488898422983
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,256,768,0.004576888763242298
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,256,1536,0.04375822345415751
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,256,1536,0.07688177956475152
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,256,512,0.0041884444653987885
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,256,1024,0.05682222048441569
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,256,768,0.02638133366902669
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,256,768,0.048271109660466514
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,256,256,0.0034942221310403612
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,256,512,0.03866044349140591
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,256,512,0.020976000361972388
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,256,128,0.0031537777847713898
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,256,256,0.03047377864519755
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,256,256,0.015673778123325773
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,256,64,0.003142222141226133
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,256,32,0.0031511110977994073
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,256,128,0.013408000270525614
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,256,128,0.024396444360415142
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,256,64,0.012832000023788877
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,128,65536,0.09069066577487522
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,256,32,0.0127697777416971
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,128,51200,0.07184800174501207
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,256,4096,0.17862399419148764
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,128,16384,0.029488000604841445
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,256,10240,0.2963742150200738
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,256,1024,0.03149866726663377
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,128,16384,0.4570159912109375
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,128,12288,0.020283554991086323
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,128,12288,0.3456888993581136
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,128,10240,0.016075554821226332
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,128,12288,0.5201946894327799
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,128,16384,0.6847902403937446
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,128,51200,1.3980151282416449
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,128,8192,0.013356444736321768
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,128,10240,0.2902195453643799
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,128,65536,1.7904586791992188
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,128,7168,0.012087999946541257
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,128,6144,0.010885333021481832
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,128,8192,0.23404354519314238
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,128,10240,0.43703556060791016
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,128,8192,0.3527795473734538
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,128,7168,0.20590133137173125
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,128,5120,0.009349333743254343
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,128,4096,0.00795288880666097
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,128,6144,0.17740355597601998
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,128,7168,0.31199465857611763
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,128,3584,0.007607999775144789
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,128,51200,2.0925706227620444
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,128,6144,0.2696933216518826
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,128,5120,0.14716355005900064
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,128,3072,0.006736889067623351
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,128,5120,0.22572623358832467
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,128,4096,0.11492978201972114
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,128,4096,0.17887022760179308
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,128,2560,0.00628977765639623
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,128,3584,0.0985777775446574
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,128,2048,0.005584888988071018
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,128,3584,0.15642666816711426
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,128,3072,0.0832479993502299
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,128,3072,0.1350275543000963
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,128,2560,0.06974844137827556
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,128,1536,0.005153777698675792
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,128,2560,0.11579644680023193
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,128,1024,0.004179555508825514
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,128,65536,2.674082650078667
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,128,2048,0.0961502194404602
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,128,2048,0.0568737785021464
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,128,512,0.0036231109665499795
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,128,1536,0.07585599687364367
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,128,1024,0.030745777818891738
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,128,256,0.003343111111058129
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,128,768,0.047657777865727745
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,128,512,0.03832799858517117
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,128,128,0.0031537777847713898
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,128,256,0.02933244572745429
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,128,128,0.0129439996348487
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,128,128,0.023688889212078516
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,128,64,0.0028764444092909494
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,128,32,0.0028577778074476454
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,128,64,0.012424888710180918
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,128,32,0.012387555506494312
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,64,65536,0.08628977669609918
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,64,51200,0.06844621896743774
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,128,768,0.0038746665749284956
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,128,1536,0.04263733492957222
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3840,128,1024,0.0563102232085334
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,128,768,0.025721778472264607
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,64,12288,0.01646399994691213
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,128,512,0.02035999960369534
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,64,10240,0.015855110353893705
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,128,256,0.014904000692897372
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,64,8192,0.012785777449607849
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,64,16384,0.4567226833767361
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,64,12288,0.34516178237067324
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,64,7168,0.011372444530328115
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,64,10240,0.2902639971839057
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,64,6144,0.01038577738735411
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,64,8192,0.2337475617726644
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,64,5120,0.008990222381220924
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,64,4096,0.00796888851457172
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,64,7168,0.20586578051249185
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,64,6144,0.177328003777398
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,64,5120,0.14720800187852648
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,64,3584,0.0073315559162033936
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,64,3072,0.006595555692911148
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,64,4096,0.11477422714233398
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,64,2560,0.005943111247486538
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,64,2048,0.005559999909665849
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,64,3584,0.09809777471754287
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,64,3072,0.0827617777718438
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,64,16384,0.0281315545241038
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,64,1536,0.004584889031118817
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,64,65536,1.7875226338704426
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,64,1024,0.004212444441186057
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,64,2048,0.0561351113849216
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,64,768,0.0038906666967603895
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,64,512,0.003567999849716822
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,64,256,0.003185777821474605
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,64,1536,0.04198666744761997
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,64,1024,0.030581331915325586
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,64,128,0.002858666703104973
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,64,768,0.025425778494940862
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,64,512,0.020242666204770405
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,64,64,0.002858666703104973
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,64,32,0.002817777709828483
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,64,256,0.014818666709793938
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,64,128,0.01275199982855055
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,64,64,0.012063110868136087
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,64,32,0.0121742222044203
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,32,51200,0.06738222307629056
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,32,12288,0.014085332552591959
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,32,16384,0.45679733488294816
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,64,51200,1.3988151550292969
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,32,12288,0.3451697826385498
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,32,10240,0.011653333074516721
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,32,8192,0.0103502223889033
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,32,7168,0.010015111002657149
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,64,2560,0.06993155346976386
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,32,6144,0.009034666750166152
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,32,10240,0.28944622145758736
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,32,8192,0.2343662314944797
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,32,7168,0.20560533470577666
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,32,4096,0.00999466660949919
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,32,6144,0.17719466156429717
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,32,65536,0.08533244662814671
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,32,3584,0.008640888664457533
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,32,3072,0.007666666474607255
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,32,5120,0.14715645048353407
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,32,16384,0.025773333178626165
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,32,2560,0.007374222079912822
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,32,4096,0.1142444478140937
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,32,2048,0.005222222043408289
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,32,51200,1.3997333314683702
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,32,1536,0.004883555488453971
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,32,3584,0.09839200311236912
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,32,1024,0.0042053332759274375
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,32,3072,0.08314844634797838
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,32,768,0.003583999971548716
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,32,512,0.003228444399105178
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,32,2048,0.05715466870201958
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,32,1536,0.04261777798334757
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,32,256,0.0031582222630580268
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,32,1024,0.030477331744299993
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,32,128,0.0028453332682450614
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,32,768,0.025715554753939312
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,32,64,0.0028204443968004654
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,32,512,0.020237333244747586
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,32,32,0.0028151110228565005
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,32,256,0.014853333433469137
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,32,128,0.012736000120639801
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,32,64,0.012412444584899478
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,32,32,0.011721777419249216
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3840,32,5120,0.011395555403497485
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,32,2560,0.06987733311123319
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3840,32,65536,1.787865744696723
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,65536,12288,3.278843561808268
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,65536,10240,3.021664089626736
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,65536,16384,4.3080567253960504
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,65536,10240,3.228988435533312
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,65536,12288,3.921143001980252
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,65536,16384,5.416568756103516
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,65536,8192,2.2463982899983725
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,65536,6144,1.749595536126031
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,65536,7168,2.022038141886393
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,65536,8192,2.4693963792588973
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,65536,7168,2.155184851752387
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,65536,5120,1.4695946375528972
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,65536,6144,1.8452311621771917
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,65536,4096,1.1727111604478624
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,65536,3584,1.0048675537109375
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,65536,4096,1.1931155522664387
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,65536,5120,1.5746328565809462
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,65536,3584,1.0490088992648654
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,65536,2560,0.767540454864502
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,65536,3072,0.8658302095201281
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,65536,3072,0.9423600302802192
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,65536,2560,0.7859413358900281
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,65536,1536,0.4585217899746365
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,65536,2048,0.544322649637858
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,65536,1024,0.3197297785017225
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,65536,1536,0.49954313702053493
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,65536,2048,0.6994969050089518
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,65536,768,0.24938223097059461
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,65536,512,0.18004977703094482
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,65536,256,0.13457866509755453
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,65536,1024,0.4223208957248264
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,65536,768,0.40519732899136013
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,65536,512,0.25517598787943524
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,65536,128,0.11418222056494819
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,65536,64,0.11454933219485813
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,65536,256,0.22403377956814238
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,65536,32,0.0929573310746087
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,65536,128,0.2138204442130195
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,65536,64,0.21373066637251112
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,65536,32,0.2258737881978353
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,65536,51200,13.668641832139757
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,51200,16384,3.4566355811225047
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,51200,16384,4.397928025987413
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,51200,12288,2.886912875705295
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,51200,12288,3.0799403720431857
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,51200,10240,2.427212397257487
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,51200,8192,2.043797387017144
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,51200,8192,2.016996383666992
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,51200,10240,2.5816194746229386
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,51200,7168,1.677608913845486
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,51200,51200,10.804812961154513
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,51200,6144,1.4904951519436305
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,51200,7168,1.7229039933946397
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,51200,5120,1.1866657469007704
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,51200,4096,0.8571804364522299
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,51200,5120,1.2505253685845268
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,51200,6144,1.4539111455281575
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,51200,3584,0.7777866787380643
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,51200,3072,0.658608012729221
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,65536,51200,23.408447265625
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,51200,3584,0.8424942228529188
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,51200,4096,0.9737058215671115
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,51200,2560,0.6008684370252821
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,51200,2048,0.41091288460625547
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,51200,65536,13.837848239474825
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,51200,3072,0.7568924691942004
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,51200,2560,0.6461057662963867
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,51200,1024,0.2623644404941135
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,51200,1536,0.3827368948194716
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,51200,768,0.18206489086151123
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,51200,2048,0.5024319754706489
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,51200,1024,0.3006257745954725
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,51200,1536,0.42884355121188694
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,51200,512,0.14939199553595647
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,51200,256,0.09176888730790879
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,51200,128,0.08181244134902954
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,51200,64,0.07401155763202243
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,51200,256,0.1777448919084337
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,51200,32,0.07852977514266968
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,51200,128,0.18443289068010119
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,51200,512,0.2007217804590861
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,51200,64,0.17073867056104872
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,51200,768,0.2592239909701877
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,51200,32,0.17116088337368437
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,16384,16384,1.145857810974121
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,16384,16384,1.6482666863335504
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,16384,12288,0.8650737868414985
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,16384,10240,0.7510373327467176
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,51200,51200,18.02996826171875
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,16384,12288,1.1938098271687825
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,16384,51200,3.570929633246528
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,16384,8192,0.6023475329081217
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,16384,8192,0.7812159856160482
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,16384,7168,0.5416906674702963
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,16384,65536,4.481685214572482
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,16384,6144,0.3895955615573459
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,16384,5120,0.38137155108981663
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,16384,7168,0.7276026407877604
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,16384,6144,0.6972328821818033
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,16384,5120,0.5058702362908257
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,16384,4096,0.30330223507351345
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,16384,3584,0.25670311186048717
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,16384,10240,1.0382649103800456
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,16384,4096,0.38019111421373153
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,16384,3072,0.21952533721923828
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,16384,3584,0.3334453370836046
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,16384,2560,0.18517066372765434
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,16384,2048,0.1390897830327352
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,16384,3072,0.33968178431193036
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,16384,1536,0.11610933144887288
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,16384,2560,0.24224978023105195
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,16384,1024,0.08163111077414618
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,16384,768,0.06068266762627495
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,16384,2048,0.20029155413309732
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,16384,1536,0.16913421948750815
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,16384,512,0.04683466752370199
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,16384,256,0.03394577900568644
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,16384,768,0.09582577811347114
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,16384,512,0.0841111143430074
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,16384,128,0.03099200129508972
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,16384,256,0.06774755318959554
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,16384,128,0.06426399946212769
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,16384,32,0.02596355477968852
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,16384,64,0.06405511167314318
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,16384,51200,6.839948442247178
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,16384,32,0.06532266404893664
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,16384,1024,0.12237155437469482
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,51200,65536,22.55080837673611
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,16384,64,0.02688177757793003
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,16384,65536,8.230125427246094
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,12288,16384,0.8936568366156684
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,12288,12288,0.6232293446858724
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,12288,16384,1.320566177368164
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,12288,10240,0.5059786902533637
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,12288,51200,2.5228008694118924
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,12288,8192,0.38567201296488446
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,12288,12288,0.9896755218505859
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,12288,7168,0.3820622232225206
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,12288,65536,3.2419022454155813
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,12288,8192,0.6672168837653266
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,12288,10240,0.8789608743455676
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,12288,6144,0.3561324543423123
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,12288,4096,0.2112711138195462
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,12288,7168,0.5735991266038682
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,12288,5120,0.27541155285305446
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,12288,6144,0.5309066772460938
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,12288,5120,0.3982275591956244
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,12288,3072,0.16589421696133083
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,12288,4096,0.3560568756527371
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,12288,2560,0.1361075507269965
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,12288,3584,0.272183100382487
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,12288,2048,0.1090631087621053
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,12288,1536,0.09061244461271499
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,12288,3072,0.2401768896314833
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,12288,2560,0.20621955394744873
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,12288,1024,0.05891911188761393
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,12288,768,0.04771733283996582
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,12288,2048,0.16387111610836452
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,12288,1536,0.13527111212412515
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,12288,512,0.03587377733654446
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,12288,256,0.028209778997633193
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,12288,1024,0.10049155685636733
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,12288,768,0.07947555515501234
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,12288,512,0.06560711065928142
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,12288,64,0.019348444210158456
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,12288,256,0.0557253360748291
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,12288,32,0.01938311093383365
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,12288,128,0.022915555371178523
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,12288,128,0.051669332716200084
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,12288,64,0.05159911182191637
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,12288,32,0.05263555712170071
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,12288,3584,0.17878222465515137
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,10240,16384,0.6932266553243002
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,12288,51200,5.236785888671875
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,10240,12288,0.5621075630187988
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,10240,16384,1.158373302883572
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,10240,10240,0.4383991029527452
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,10240,12288,0.8828017976548937
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,10240,51200,2.227404488457574
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,10240,10240,0.7060506608751086
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,10240,8192,0.35848177803887266
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,12288,65536,6.906035529242621
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,10240,7168,0.34764356083340114
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,10240,6144,0.28794754876030815
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,10240,65536,2.862614313761393
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,10240,8192,0.5670826699998643
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,10240,5120,0.25433243645562065
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,10240,7168,0.4914248784383138
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,10240,6144,0.4650755458407932
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,10240,4096,0.20503555403815377
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,10240,3072,0.1442693339453803
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,10240,3584,0.18201333946651885
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,10240,5120,0.4187608824835883
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,10240,3584,0.23932088745964897
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,10240,2560,0.11616533332400852
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,10240,2048,0.1048320002026028
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,10240,1536,0.07758933305740356
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,10240,3072,0.23738132582770455
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,10240,1024,0.0516844458050198
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,10240,2560,0.22838134235805937
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,10240,2048,0.14565600289238825
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,10240,1536,0.11768444379170735
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,10240,512,0.031854222218195595
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,10240,1024,0.09018311235639785
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,10240,256,0.023391111029518977
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,10240,768,0.07370577918158637
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,10240,128,0.018900444110234577
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,10240,512,0.058371557129753955
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,10240,64,0.016220443778567843
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,10240,256,0.05005155669318306
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,10240,32,0.016837333639462788
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,10240,128,0.04555288950602213
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,10240,64,0.044403556320402354
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,10240,32,0.04435999857054817
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,10240,51200,4.589792887369792
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,10240,4096,0.275673786799113
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,10240,768,0.0418524444103241
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,8192,16384,0.5860017670525445
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,10240,65536,5.741522471110026
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,8192,12288,0.4744266404045953
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,8192,16384,1.0085022184583876
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,8192,51200,1.930940416124132
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,8192,10240,0.3646808995140924
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,8192,8192,0.3180035485161675
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,8192,65536,2.5220559438069663
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,8192,12288,0.7636995315551758
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,8192,10240,0.6212008794148763
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,8192,7168,0.2971786657969157
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,8192,6144,0.23205065727233887
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,8192,8192,0.5360453393724229
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,8192,4096,0.1592737833658854
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,8192,5120,0.20537955231136748
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,8192,7168,0.47371557023790145
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,8192,3584,0.12752177980211046
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,8192,6144,0.372126234902276
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,8192,4096,0.24498399098714194
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,8192,3072,0.11097688807381524
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,8192,2560,0.10159289174609715
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,8192,2048,0.07545333438449435
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,8192,3584,0.24804266293843588
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,8192,1536,0.058205333020952016
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,8192,3072,0.1836613284216987
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,8192,2560,0.15654399659898546
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,8192,1024,0.041125333971447416
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,8192,768,0.03455911080042521
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,8192,2048,0.12828177875942653
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,8192,512,0.025458667013380263
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,8192,1536,0.10434310966067845
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,8192,256,0.01975022256374359
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,8192,1024,0.07706489165623982
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,8192,768,0.062330669826931424
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,8192,128,0.015770667129092746
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,8192,64,0.013344888885815939
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,8192,512,0.04975822236802843
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,8192,32,0.013428444663683573
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,8192,256,0.04110844598876105
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,8192,128,0.036701334847344294
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,8192,64,0.03599822190072801
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,8192,32,0.03496711121665107
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,8192,5120,0.3201528920067681
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,7168,16384,0.4748400052388509
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,8192,51200,4.014532301161024
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,7168,12288,0.3625315560234918
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,8192,65536,4.95290035671658
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,7168,10240,0.30949245558844674
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,7168,51200,1.4816800223456488
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,7168,16384,0.9291359583536783
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,7168,12288,0.7131519847446017
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,7168,8192,0.2552684413062202
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,7168,7168,0.21483377615610758
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,7168,10240,0.6022791332668728
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,7168,65536,2.0293511284722223
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,7168,6144,0.22135021951463488
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,7168,5120,0.16403644614749485
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,7168,7168,0.4062497880723741
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,7168,8192,0.48672978083292645
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,7168,4096,0.15101333459218344
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,7168,3584,0.12219199869367812
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,7168,6144,0.3651119867960612
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,7168,4096,0.24038044611612955
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,7168,5120,0.3085537751515706
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,7168,2560,0.08073155747519599
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,7168,3584,0.19717244307200113
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,7168,2048,0.06623911195331149
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,7168,1536,0.051473776499430336
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,7168,3072,0.17305244339836967
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,7168,1024,0.03440622157520718
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,7168,768,0.0270453327231937
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,7168,2048,0.12098933590783013
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,7168,2560,0.1470995611614651
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,7168,1536,0.09640177753236558
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,7168,512,0.021640888518757288
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,7168,256,0.01757333344883389
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,7168,128,0.01478666729397244
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,7168,768,0.05755644374423557
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,7168,512,0.04602577620082431
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,7168,64,0.01238933371173011
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,7168,32,0.012728888955381183
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,7168,128,0.03369155526161194
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,7168,64,0.03278755479388767
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,7168,32,0.03271822134653727
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,7168,3072,0.11051911115646362
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,7168,1024,0.0716480016708374
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,7168,256,0.03712711069318984
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,7168,65536,4.456128862169054
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,6144,16384,0.45503997802734375
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,6144,51200,1.4299324883355036
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,6144,12288,0.3416951232486301
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,7168,51200,3.4580133226182728
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,6144,65536,1.9222496880425348
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,6144,10240,0.2984631061553955
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,6144,8192,0.2203608883751763
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,6144,16384,0.8503688706292046
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,6144,7168,0.19610310925377739
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,6144,12288,0.6508062150743272
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,6144,6144,0.17733066611819795
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,6144,10240,0.5764826668633355
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,6144,7168,0.36977510982089573
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,6144,5120,0.15551111433241102
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,6144,6144,0.3211217721303304
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,6144,4096,0.11744888623555501
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,6144,5120,0.2677653365665012
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,6144,3584,0.09671822521421646
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,6144,4096,0.21779289510515001
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,6144,3072,0.0857342216703627
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,6144,3584,0.1795226732889811
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,6144,2560,0.07358755668004353
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,6144,2048,0.05589689148796929
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,6144,3072,0.15538044770558676
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,6144,2560,0.1338640054066976
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,6144,1536,0.043637331989076406
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,6144,1024,0.029827555020650227
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,6144,2048,0.11295644442240398
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,6144,768,0.023178666830062866
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,6144,1536,0.08768000205357869
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,6144,512,0.018067555295096505
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,6144,1024,0.06488355663087633
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,6144,256,0.014146667387750415
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,6144,128,0.012392000191741519
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,6144,768,0.053251554568608604
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,6144,51200,3.052833769056532
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,6144,512,0.04138844543033176
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,6144,256,0.033569776349597506
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,6144,8192,0.4464471075269911
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,6144,32,0.010728889041476779
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,6144,128,0.029891557163662378
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,6144,64,0.031181332137849595
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,6144,32,0.029463112354278564
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,6144,65536,4.018057081434462
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,5120,16384,0.36719645394219297
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,5120,12288,0.292592896355523
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,6144,64,0.01073066641887029
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,5120,51200,1.1695955064561632
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,5120,16384,0.7896444532606336
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,5120,10240,0.25692889425489635
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,5120,8192,0.20392444398668078
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,5120,65536,1.4893004099527996
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,5120,7168,0.16357510619693333
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,5120,6144,0.14305955833858913
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,5120,12288,0.6212631331549751
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,5120,10240,0.4820924335055881
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,5120,8192,0.3890106678009033
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,5120,5120,0.1228826708263821
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,5120,4096,0.09963999854193793
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,5120,7168,0.38093066215515137
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,5120,3584,0.08978311220804851
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,5120,5120,0.24563911226060656
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,5120,6144,0.3202515443166097
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,5120,3072,0.06881955597135755
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,5120,4096,0.1886568864186605
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,5120,2560,0.06224799818462796
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,5120,2048,0.05057422320048014
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,5120,1536,0.03628888726234436
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,5120,1024,0.02732533382044898
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,5120,3072,0.16039021809895834
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,5120,2560,0.12793689303927952
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,5120,768,0.024479111035664875
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,5120,2048,0.10059911012649536
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,5120,1536,0.0819973349571228
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,5120,512,0.01905155513021681
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,5120,256,0.012851555314328937
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,5120,1024,0.059079110622406006
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,5120,768,0.04812177684572008
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,5120,512,0.03727022144529555
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,5120,64,0.009425777528021071
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,5120,256,0.0302800006336636
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,5120,32,0.009710222482681274
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,5120,128,0.027087999714745417
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,5120,64,0.02676533328162299
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,5120,32,0.0269822229941686
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,5120,51200,2.7723511589898
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,4096,16384,0.29769688182406956
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,5120,3584,0.16378222571478948
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,5120,65536,3.5474107530381946
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,4096,51200,0.8421297603183322
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,4096,12288,0.20465600490570068
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,4096,65536,1.1501679950290256
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,5120,128,0.011019555230935415
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,4096,10240,0.20309689309861925
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,4096,8192,0.15878933005862766
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,4096,16384,0.8129875395033094
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,4096,12288,0.5310266812642416
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,4096,10240,0.4383937782711453
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,4096,6144,0.10967822207344903
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,4096,5120,0.09075111150741577
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,4096,7168,0.332893345091078
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,4096,4096,0.07741066482332018
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,4096,6144,0.2669680118560791
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,4096,4096,0.1787093347973294
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,4096,3072,0.05494133300251431
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,4096,3584,0.15004977915022108
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,4096,2560,0.04621244470278422
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,4096,3072,0.13004355960422093
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,4096,51200,2.378072950575087
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,4096,7168,0.14559911357031927
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,4096,2048,0.037603557109832764
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,4096,2560,0.11045689053005642
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,4096,1536,0.03088888857099745
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,4096,1024,0.021320889393488567
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,4096,2048,0.08949777815077041
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,4096,1536,0.07287200291951497
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,4096,768,0.01703377730316586
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,4096,1024,0.053103112512164645
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,4096,65536,3.021802690294054
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,4096,256,0.010348444183667501
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,4096,5120,0.22377777099609375
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,4096,768,0.04321777820587158
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,4096,128,0.008969777988062965
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,4096,512,0.0333555539449056
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,4096,64,0.007954667011896769
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,4096,32,0.008002666963471307
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,4096,128,0.024173332585228816
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,4096,64,0.023987554841571387
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,4096,32,0.02349777850839827
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,4096,8192,0.3523840109507243
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,4096,512,0.014102222190962898
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,3584,51200,0.820067564646403
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,4096,3584,0.0627653333875868
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,3584,16384,0.26599378055996364
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,4096,256,0.026408000124825373
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,3584,12288,0.1849599944220649
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,3584,10240,0.17140621609157988
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,3584,8192,0.1439031097624037
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,3584,10240,0.41895378960503477
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,3584,12288,0.4991360240512424
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,3584,16384,0.8450711038377551
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,3584,7168,0.11599022812313503
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,3584,6144,0.10391644636789958
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,3584,5120,0.08188266886605157
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,3584,8192,0.3588346640268962
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,3584,4096,0.0643484459982978
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,3584,7168,0.2962791124979655
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,3584,65536,0.9461004469129773
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,3584,6144,0.2530408965216743
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,3584,3072,0.04814755585458544
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,3584,5120,0.21221778127882215
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,3584,4096,0.1676417721642388
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,3584,2560,0.04052711195415921
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,3584,2048,0.035537779331207275
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,3584,3584,0.1416977776421441
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,3584,3072,0.122597336769104
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,3584,1536,0.02664622167746226
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,3584,1024,0.020082667469978333
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,3584,2560,0.10565244489245945
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,3584,2048,0.08541688654157852
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,3584,768,0.016031111280123394
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,3584,512,0.012343111137549082
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,3584,1536,0.0688755578464932
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,3584,256,0.00959822204377916
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,3584,128,0.008330666356616551
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,3584,768,0.04021599888801575
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,3584,512,0.031135112047195435
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,3584,64,0.007780444290902879
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,3584,65536,2.8046222262912326
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,3584,32,0.007948444121413762
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,3584,51200,2.1914605034722223
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,3584,128,0.022655111220147874
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,3584,64,0.021996445126003687
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,3584,32,0.022545778089099463
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,3072,16384,0.2548248767852783
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,3584,3584,0.056223114331563316
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,3072,12288,0.16452266110314265
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,3072,51200,0.7195128864712186
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,3072,65536,0.9953413009643555
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,3072,10240,0.17890400356716582
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,3584,1024,0.04930666751331753
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,3072,16384,0.6624319818284776
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,3072,8192,0.13780266708797878
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,3584,256,0.024679111109839544
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,3072,12288,0.4669404559665256
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,3072,7168,0.11228177282545303
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,3072,6144,0.09120000070995754
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,3072,5120,0.07797244522306654
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,3072,8192,0.31672443283928764
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,3072,10240,0.42986310852898496
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,3072,4096,0.06140622165468004
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,3072,3584,0.058182219664255776
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,3072,7168,0.30320265558030873
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,3072,6144,0.2389777766333686
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,3072,3072,0.05052711235152351
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,3072,5120,0.19783555136786568
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,3072,2560,0.04088266690572103
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,3072,2048,0.03410844339264764
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,3072,1536,0.0236799998415841
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,3072,3584,0.1359297831853231
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,3072,3072,0.12366578314039443
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,3072,1024,0.01666755477587382
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,3072,2560,0.1001582211918301
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,3072,768,0.013537777794731988
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,3072,512,0.011728888584507836
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,3072,1536,0.06174666351742215
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,3072,1024,0.04701866706212362
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,3072,768,0.03868710994720459
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,3072,51200,2.0586026509602866
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,3072,128,0.008282666405042013
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,3072,256,0.023028444912698533
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,3072,64,0.007258666886223688
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,3072,128,0.02128622266981337
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,3072,32,0.007647111184067196
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,3072,65536,2.5927776760525174
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,3072,32,0.020688888099458482
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,3072,4096,0.1549031072192722
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,3072,2048,0.08079999685287476
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,3072,256,0.009016888837019602
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,2560,65536,0.675797356499566
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,3072,512,0.02982399861017863
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,2560,16384,0.18818044662475586
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,2560,12288,0.14609866672092015
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,2560,10240,0.12611733542548284
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,3072,64,0.020581333173645865
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,2560,8192,0.09385155306922065
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,2560,16384,0.6131022241380479
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,2560,12288,0.44449424743652344
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,2560,7168,0.08851022190517849
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,2560,10240,0.3711262279086643
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,2560,6144,0.07117155525419447
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,2560,8192,0.30124089452955455
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,2560,5120,0.05789955457051595
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,2560,7168,0.264448881149292
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,2560,3584,0.0432515541712443
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,2560,6144,0.22628532515631783
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,2560,3072,0.03754666778776381
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,2560,4096,0.14914666281806097
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,2560,5120,0.18793155087365043
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,2560,2560,0.03106488784154256
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,2560,3584,0.12718933158450657
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,2560,2048,0.026007999976476032
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,2560,51200,0.5994488928053114
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,2560,1536,0.02032177812523312
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,2560,3072,0.10950755410724217
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,2560,2560,0.09304266505771214
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,2560,1024,0.014803555276658801
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,2560,768,0.012341332932313284
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,2560,512,0.009722666607962714
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,2560,1536,0.05841422080993652
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,2560,65536,2.4172950320773654
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,2560,1024,0.04379644327693515
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,2560,256,0.007280000381999546
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,2560,128,0.007298666569921706
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,2560,512,0.027814222706688776
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,2560,64,0.006630222416586346
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,2560,32,0.006716444260544247
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,2560,128,0.019849777221679688
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,2560,256,0.021662222014533147
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,2560,64,0.019276445110638935
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,2560,32,0.01924444403913286
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,2560,4096,0.04599110947714912
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,2048,16384,0.15215288268195257
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,2048,51200,0.4514195654127333
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,2048,65536,0.5503688918219672
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,2048,12288,0.10870755381054348
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,2048,10240,0.09508888589011298
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,2560,2048,0.07564089033338758
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,2560,51200,1.8748772939046223
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,2560,768,0.03626222080654568
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,2048,8192,0.07077333662245008
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,2048,12288,0.463988463083903
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,2048,7168,0.06876889202329847
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,2048,6144,0.05731822384728325
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,2048,10240,0.37053688367207843
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,2048,7168,0.25000977516174316
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,2048,8192,0.2831973234812419
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,2048,6144,0.21387199560801187
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,2048,4096,0.03749955693880717
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,2048,3584,0.03415911065207587
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,2048,5120,0.1813911067114936
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,2048,3072,0.028809779220157202
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,2048,2560,0.02606311109330919
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,2048,4096,0.13811822732289633
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,2048,2048,0.02176355487770504
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,2048,3072,0.10497955481211345
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,2048,2560,0.08775733576880561
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,2048,1536,0.01805688937505086
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,2048,51200,1.744050661722819
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,2048,1024,0.013284444808959961
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,2048,2048,0.0715235537952847
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,2048,768,0.011360000405046674
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,2048,512,0.009333333207501305
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,2048,1536,0.056530667675866016
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,2048,1024,0.039678222603268094
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,2048,256,0.00833155545923445
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,2048,768,0.033278223541047834
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,2048,128,0.00591466658645206
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,2048,512,0.026603556341595117
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,2048,64,0.005215999980767568
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,2048,32,0.005552000055710475
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,2048,256,0.020591111646758187
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,2048,16384,0.5557502110799154
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,2048,128,0.018555555078718398
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,2048,64,0.017858665850427415
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,2048,32,0.017859554953045316
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,2048,5120,0.04571288824081421
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,1536,16384,0.12189600202772354
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,1536,51200,0.3427751064300537
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,1536,65536,0.4582799805535211
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,1536,12288,0.08698578013314141
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,2048,3584,0.11966489420996772
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,1536,16384,0.5204835467868382
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,1536,12288,0.41185333993699813
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,1536,8192,0.06583378050062391
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,1536,10240,0.3313235441843669
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,1536,7168,0.05723377731111315
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,2048,65536,2.23600705464681
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,1536,6144,0.0484426650736067
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,1536,5120,0.037772443559434675
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,1536,8192,0.27006133397420246
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,1536,7168,0.2349946763780382
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,1536,4096,0.028836445675955877
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,1536,6144,0.20170133643680146
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,1536,3584,0.026131555438041687
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,1536,3072,0.024163555767801072
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,1536,5120,0.16694311300913492
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,1536,2560,0.0203795548942354
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,1536,4096,0.1302257776260376
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,1536,51200,1.6221751107109919
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,1536,2048,0.016584888100624084
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,1536,3072,0.09714577595392863
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,1536,2560,0.08261777957280476
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,1536,10240,0.07517511314815946
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,1536,1024,0.01033155537313885
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,1536,768,0.0087013335691558
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,1536,2048,0.06772444645563762
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,1536,1536,0.052684442864524
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,1536,512,0.006937777830494775
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,1536,256,0.005899555567238066
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,1536,1024,0.0369777778784434
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,1536,65536,2.073394563462999
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,1536,128,0.005595555735958948
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,1536,768,0.03136444422933791
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,1536,512,0.024693333440356787
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,1536,64,0.005218666460778978
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,1536,256,0.01889955500761668
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,1536,128,0.01716977854569753
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,1536,64,0.016507556041081745
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,1536,32,0.016164445214801364
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,1024,16384,0.0815111133787367
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,1024,65536,0.30615822474161786
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,1024,51200,0.24688267707824707
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,1024,12288,0.06688533226648967
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,1024,10240,0.05087822344568041
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,1536,3584,0.11239200168185765
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,1024,12288,0.37985510296291775
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,1536,1536,0.013813333378897773
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,1024,16384,0.4891644583808051
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,1024,8192,0.04066310988532172
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,1024,10240,0.3238737848069933
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,1024,6144,0.02944533361328973
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,1024,5120,0.025281776984532673
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,1024,8192,0.2560959921942817
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,1024,7168,0.2201706700854831
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,1024,4096,0.020908445119857788
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,1536,32,0.004912888838185204
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,1024,5120,0.1565706729888916
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,1024,3584,0.018575999471876357
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,1024,3072,0.01685688893000285
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,1024,2560,0.014212444424629211
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,1024,4096,0.12144977516598171
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,1024,3584,0.10543288787206014
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,1024,3072,0.09114933013916016
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,1024,1536,0.010176888770527309
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,1024,2560,0.07689155472649468
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,1024,51200,1.5035084618462458
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,1024,1024,0.008336000144481659
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,1024,768,0.007284444239404466
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,1024,2048,0.06287999947865804
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,1024,1536,0.04790755444102817
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,1024,512,0.00627377794848548
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,1024,256,0.004921777794758479
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,1024,768,0.02901511059867011
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,1024,65536,1.9261279635959203
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,1024,128,0.004600888739029567
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,1024,64,0.003953777667548922
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,1024,256,0.017501332693629794
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,1024,32,0.004200889004601372
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,1024,7168,0.03450489044189453
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,1024,128,0.015460444821251763
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,1024,64,0.014819555812411837
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,1024,32,0.0148053334818946
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,768,65536,0.24020799001057944
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,768,51200,0.20958756075965035
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,1024,6144,0.19885155889723036
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,768,16384,0.06390666961669922
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,768,12288,0.047445333666271634
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,768,10240,0.041322665082083807
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,1024,2048,0.012059555285506778
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,768,8192,0.030360887447992962
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,768,12288,0.356964455710517
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,768,16384,0.46927642822265625
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,768,10240,0.2990017731984456
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,768,7168,0.025635555386543274
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,1024,1024,0.03426311082310147
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,768,6144,0.02386133372783661
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,768,5120,0.01983644399378035
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,1024,512,0.02290488945113288
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,768,4096,0.016584000653690763
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,768,7168,0.21182310581207275
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,768,6144,0.1824044386545817
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,768,3584,0.014849777022997538
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,768,5120,0.1504560046725803
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,768,4096,0.11706844965616862
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,768,3584,0.10059911012649536
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,768,2560,0.011815999945004782
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,768,2048,0.010384889112578498
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,768,3072,0.08648177650239731
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,768,1536,0.00867555538813273
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,768,51200,1.4429155985514324
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,768,2560,0.07357600000169542
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,768,1024,0.0069448889957533936
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,768,2048,0.05951822466320462
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,768,768,0.006248888870080312
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,768,512,0.005214222189452913
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,768,1536,0.044871111710866295
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,768,256,0.004512888689835866
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,768,1024,0.03281689021322463
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,768,65536,1.8424888186984594
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,768,768,0.027803556786643133
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,768,128,0.0041724443435668945
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,768,512,0.021988444858127173
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,768,64,0.004197333421972063
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,768,256,0.01648533344268799
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,768,32,0.004184000194072723
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,768,128,0.014831999937693277
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,768,32,0.014132445057233175
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,768,8192,0.24124532275729707
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,512,65536,0.20982310507032606
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,512,51200,0.16778577698601616
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,512,16384,0.05725600322087606
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,512,12288,0.04371910956170824
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,512,10240,0.03298844562636481
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,768,3072,0.013519110778967539
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,512,8192,0.026307556364271376
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,512,12288,0.34631554285685223
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,512,16384,0.45769331190321183
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,512,7168,0.023690667417314317
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,512,10240,0.2910488976372613
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,512,6144,0.020933333370420668
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,512,8192,0.23505422804090711
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,512,5120,0.018057778477668762
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,512,4096,0.01484266585773892
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,512,7168,0.20599733458624947
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,512,6144,0.17768711513943145
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,512,3584,0.013807111316257052
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,512,5120,0.146323561668396
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,512,3072,0.012039999994966718
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,512,4096,0.11341333389282227
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,512,2560,0.01072355525361167
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,512,2048,0.009358222285906473
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,768,64,0.014436443646748861
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,512,3584,0.09793511364195083
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,512,1536,0.008282666405042013
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,512,3072,0.0839608907699585
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,512,1024,0.0064737776087390045
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,512,2560,0.07141333156161837
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,512,768,0.005608888963858287
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,512,2048,0.057504885726504855
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,512,512,0.005225777626037598
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,512,51200,1.4029377831353083
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,512,256,0.0041955556306574075
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,512,1536,0.043106665213902794
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,512,1024,0.031806220610936485
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,512,128,0.003917333152559069
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,512,64,0.003843555433882607
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,512,512,0.02130844526820713
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,512,32,0.0038604442444112566
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,512,256,0.015817777978049386
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,512,128,0.013783999615245394
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,512,65536,1.7908488379584417
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,512,64,0.013793778088357715
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,256,65536,0.12548444006178114
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,256,16384,0.039213332864973284
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,256,51200,0.09973066382937962
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,256,12288,0.025489777326583862
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,256,10240,0.020346666375796
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,256,8192,0.01685599982738495
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,256,10240,0.2788631121317546
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,256,12288,0.3315040005577935
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,256,16384,0.4383848773108588
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,256,8192,0.22517421510484484
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,256,7168,0.015217777755525378
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,256,6144,0.01367111090156767
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,256,5120,0.011746666497654386
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,256,4096,0.010336000058386061
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,256,7168,0.19763378302256265
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,256,6144,0.17021600405375162
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,256,3584,0.009348444640636444
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,256,3072,0.008622222476535374
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,512,768,0.02674399978584713
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,256,4096,0.10878933138317531
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,256,5120,0.1399137841330634
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,256,2560,0.007937777373525832
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,256,2048,0.0069439998931354946
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,256,3584,0.09326933489905463
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,256,1536,0.006217777729034424
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,256,3072,0.08015644550323486
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,512,32,0.013196444345845116
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,256,1024,0.005199999858935674
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,256,51200,1.3425458272298176
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,256,2048,0.05452533231841194
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,256,768,0.004580444345871608
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,256,512,0.0041759999261962045
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,256,1536,0.04150222076310052
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,256,256,0.003855111284388436
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,256,128,0.0038399998512532976
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,256,1024,0.0302471121152242
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,256,768,0.02570844524436527
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,256,64,0.003559999995761447
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,256,32,0.0035706667436493766
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,256,256,0.015486222174432544
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,256,128,0.013437333206335703
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,256,64,0.012847111456924014
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,128,65536,0.0841182205412123
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,256,32,0.012478222449620565
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,128,51200,0.06812000274658203
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,128,16384,0.028685334655973647
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,128,12288,0.01958933307064904
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,128,12288,0.32395821147494847
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,128,16384,0.42824533250596786
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,128,10240,0.017501332693629794
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,128,8192,0.013182222015327878
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,256,2560,0.06783999999364217
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,128,7168,0.012114666402339935
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,128,10240,0.2719208929273817
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,256,512,0.020277332928445604
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,128,6144,0.010631110933091907
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,128,8192,0.21972889370388457
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,128,5120,0.00941955546538035
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,256,65536,1.713746706644694
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,128,4096,0.008186666501892937
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,128,7168,0.1929262214236789
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,128,3584,0.007612444460391998
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,128,3072,0.006792000184456508
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,128,6144,0.16557244459788004
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,128,5120,0.13696711593204075
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,128,51200,1.3081981870863173
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,128,4096,0.10635199811723496
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,128,2560,0.005953777581453323
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,128,2048,0.005586666779385672
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,128,3584,0.09108533461888631
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,128,1536,0.004919111314747068
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,128,1024,0.004230222354332606
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,128,3072,0.07762489053938124
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,128,768,0.004181333300140169
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,128,2560,0.06596355305777656
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,128,2048,0.052516443861855396
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,128,65536,1.6738541920979817
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,128,1536,0.03943466809060838
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,128,256,0.0032275555034478507
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,128,128,0.003185777821474605
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,128,768,0.025019556283950806
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,128,64,0.0028453332682450614
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,128,512,0.019914666811625164
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,128,32,0.0028000000036425064
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,128,256,0.014495111174053617
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,128,128,0.012963555753231049
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,128,64,0.01237511138121287
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,64,65536,0.07998933394749959
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,128,32,0.012447111308574677
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,64,51200,0.06482666730880737
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,64,16384,0.02471911079353756
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,64,12288,0.015466666883892484
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,64,10240,0.013125333521101209
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,64,12288,0.32386665874057347
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,64,16384,0.42767998907301163
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,64,10240,0.27178311347961426
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,64,7168,0.011741333537631564
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,64,6144,0.010377777947319878
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,64,8192,0.21965600384606254
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,64,7168,0.19294933478037515
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,128,512,0.003572444534964032
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,64,5120,0.009011555876996782
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,128,1024,0.0295688874191708
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,64,6144,0.1657386620839437
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,64,3584,0.007320000065697565
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,64,3072,0.006572444405820634
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,64,5120,0.13675555917951795
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,64,4096,0.10587466425365871
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,64,2560,0.006208000083764394
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,64,3584,0.09059466918309529
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,64,2048,0.00526311124364535
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,64,3072,0.07789333661397298
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,64,1536,0.004552888787455029
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,64,51200,1.3098666932847765
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,64,1024,0.004202666795916027
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,64,768,0.003859555555714501
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,64,2048,0.05269777774810791
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,64,1536,0.040018667777379356
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,64,512,0.003536888708670934
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,64,1024,0.02939288814862569
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,64,768,0.025040000677108765
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,64,65536,1.673450681898329
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,64,128,0.0031742221779293488
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,64,64,0.002838222309947014
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,64,512,0.01960444450378418
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,64,256,0.01443733274936676
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,64,8192,0.0123857781291008
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,64,32,0.0028808888875775864
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,64,128,0.01239822225438224
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,64,64,0.012088889049159156
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,32,65536,0.07606933514277141
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,64,32,0.011741333537631564
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,32,51200,0.06151377492480808
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,32,16384,0.023806222611003455
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,32,12288,0.012763555679056378
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,64,4096,0.007939555578761632
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,32,10240,0.012230222423871359
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,32,16384,0.42788089646233457
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,32,8192,0.010106667048401302
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,32,10240,0.27129867341783315
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,64,2560,0.06572177675035265
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,32,7168,0.009945777555306753
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,32,6144,0.009038222332795462
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,64,256,0.0032115555885765287
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,32,5120,0.011613333390818702
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,32,8192,0.21916622585720488
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,32,4096,0.009653333160612319
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,32,7168,0.19276177883148193
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,32,6144,0.16571822431352404
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,32,3584,0.009183111290136972
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,32,3072,0.00793599999613232
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,32,5120,0.13638844754960802
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,32,4096,0.10511110888587104
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,32,51200,1.310023095872667
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,32,2048,0.0052586665583981415
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,32,2560,0.06584266821543376
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,32,1536,0.00453955555955569
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,32,65536,1.6729315651787653
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,32,2048,0.05244622296757168
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,32,1024,0.004201777693298128
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,32,768,0.0035413333939181436
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,32,1536,0.04032266802257962
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,32,512,0.003216000066863166
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,32,12288,0.3231484360165066
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,32,1024,0.029245333539115057
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,32,256,0.0032008888406885993
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,32,768,0.024680000212457445
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,32,128,0.0028826666788922418
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,32,64,0.0025271111064487034
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,32,512,0.01956533392270406
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,32,256,0.0144533332851198
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,32,32,0.0028168888141711554
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,32,128,0.01240533341964086
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,32,64,0.012051555845472546
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,32,32,0.011717333561844297
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3585,32,2560,0.007291555404663086
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,32,3584,0.09108799695968628
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3585,32,3072,0.07796621984905668
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,65536,12288,3.277928034464518
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,65536,16384,4.345241970486112
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,65536,12288,3.8180194430881076
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,65536,16384,5.336726294623481
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,65536,16384,4.930242750379774
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,65536,10240,3.000260459052192
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,65536,10240,3.1354054345024953
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,65536,12288,3.566075642903646
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,65536,8192,2.4112523396809897
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,65536,10240,3.0211003621419272
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,65536,8192,2.427415211995443
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,65536,7168,2.065526326497396
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,65536,8192,2.4739803738064237
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,65536,6144,1.6759075588650172
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,65536,7168,2.0865796407063804
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,65536,7168,2.142123540242513
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,65536,6144,1.8250772688123915
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,65536,5120,1.3304915957980685
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,65536,5120,1.519526269700792
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,65536,6144,1.8507376776801214
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,65536,51200,14.039096408420138
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,65536,4096,1.085728857252333
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,65536,3584,0.9477929009331597
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,65536,4096,1.1993066999647353
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,65536,5120,1.5035510592990453
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,65536,3584,1.0582951439751518
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,65536,4096,1.191189342074924
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,65536,3584,1.0404693815443251
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,65536,3072,0.8364159795973035
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,65536,3072,0.8907146453857422
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,65536,2560,0.7169991069369845
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,65536,2048,0.5454079839918349
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,65536,2560,0.7950293223063151
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,65536,3072,0.8834640185038248
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,65536,2048,0.6198995378282335
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,65536,1536,0.41903021600511337
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,65536,2560,0.7316915724012586
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,65536,1024,0.2629804346296522
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,65536,1536,0.5014524459838867
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,65536,768,0.21151467164357504
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,65536,2048,0.6497431331210667
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,65536,1536,0.48571109771728516
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,65536,1024,0.3681760099199083
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,65536,1024,0.5177377594841851
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,65536,512,0.17086754904852974
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,65536,768,0.2911715507507324
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,65536,768,0.343539555867513
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,65536,256,0.16397778193155924
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,65536,512,0.25483910242716473
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,65536,512,0.24705065621270073
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,65536,128,0.13816266589694554
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,65536,256,0.2571022245619032
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,65536,256,0.19287999471028647
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,65536,64,0.10727110836240981
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,65536,128,0.14613600571950278
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,65536,128,0.21175732877519396
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,65536,32,0.0972106655438741
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,65536,64,0.21574578020307753
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,65536,32,0.21403466330634224
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,65536,51200,16.587736341688366
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,65536,51200,22.892498440212673
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,51200,16384,3.4065723419189453
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,51200,16384,4.321702321370442
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,51200,51200,11.053010728624132
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,51200,12288,2.5861733754475913
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,51200,16384,3.9495574103461375
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,51200,65536,13.561122470431856
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,51200,12288,3.0588506062825522
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,51200,10240,2.303548389010959
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,51200,12288,2.861878289116753
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,51200,10240,2.530085245768229
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,51200,8192,1.8656461503770616
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,51200,10240,2.44339476691352
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,51200,8192,2.0145350562201605
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,51200,51200,17.97428215874566
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,51200,7168,1.5488693449232314
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,51200,51200,13.306682162814669
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,51200,6144,1.3743421766493056
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,51200,7168,1.7625315984090169
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,51200,8192,1.922392103407118
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,51200,7168,1.7113013797336156
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,51200,5120,1.0989564259847004
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,51200,6144,1.4467804167005751
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,51200,5120,1.2462426291571724
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,51200,4096,0.8975999620225695
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,51200,65536,21.559805976019963
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,51200,6144,1.4269662433200414
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,51200,3584,0.7476240264044868
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,51200,4096,0.9841689003838433
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,51200,5120,1.1950551138983834
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,51200,4096,0.9527795579698352
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,51200,65536,16.753814697265625
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,51200,3072,0.7127760251363119
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,51200,3584,0.952755504184299
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,51200,3072,0.7903893258836535
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,51200,3584,0.8004159927368164
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,51200,2048,0.4862826665242513
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,51200,2560,0.6357030868530273
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,51200,3072,0.7001733250088162
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,51200,2048,0.5098835627237955
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,51200,1536,0.32387733459472656
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,51200,1024,0.22255555788675943
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,51200,2560,0.6931111017862955
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,51200,768,0.17496089140574136
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,51200,2048,0.5002826584710015
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,51200,1536,0.5161137580871582
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,51200,1024,0.2956799930996365
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,51200,1536,0.3880799876319037
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,51200,512,0.13445156150394016
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,51200,1024,0.3366568883260091
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,51200,256,0.09015733003616333
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,51200,2560,0.5674515300326878
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,51200,128,0.08185155524147882
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,51200,512,0.21357333660125732
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,51200,768,0.275888893339369
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,51200,256,0.1663128932317098
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,51200,64,0.06484622425503202
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,51200,32,0.07156178024080065
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,51200,768,0.24256443977355957
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,51200,128,0.12069333924187554
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,51200,64,0.1701457765367296
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,51200,128,0.16430755456288657
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,51200,32,0.1699288951026069
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,51200,512,0.19360266791449654
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,51200,256,0.1776826646592882
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,16384,16384,1.1791120105319552
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,16384,16384,1.6124408509996202
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,16384,12288,0.7981680234273275
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,16384,51200,3.7645412021213107
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,16384,65536,4.601313696967231
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,16384,12288,1.1949084599812825
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,16384,10240,0.8492382367451986
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,16384,12288,1.221576902601454
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,16384,16384,1.6383778254191081
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,16384,10240,0.970462269253201
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,16384,8192,0.6229919857449001
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,16384,51200,6.5805553860134545
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,16384,8192,0.7714311281840006
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,16384,51200,5.218465593126085
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,16384,7168,0.5390186839633518
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,16384,10240,0.9877502653333875
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,16384,8192,0.7871404223971896
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,16384,6144,0.4677297804090712
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,16384,7168,0.6916115548875598
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,16384,5120,0.32843467924329967
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,16384,7168,0.6911342408921984
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,16384,6144,0.6336800257364908
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,16384,65536,7.8734529283311625
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,16384,6144,0.5982960065205892
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,16384,4096,0.29074843724568683
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,16384,3584,0.2473155657450358
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,16384,5120,0.4999590979682074
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,16384,5120,0.5027199851142036
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,16384,4096,0.41686132219102645
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,16384,3072,0.2140453391604953
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,16384,65536,6.699224683973525
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,16384,3584,0.33414578437805176
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,16384,3072,0.29604710472954643
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,16384,2560,0.1615413294898139
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,16384,3584,0.37931733661227757
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,16384,3072,0.31422222985161674
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,16384,2048,0.14248177740308973
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,16384,2560,0.27548087967766655
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,16384,2560,0.2657324473063151
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,16384,1536,0.11743288569980198
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,16384,2048,0.20108266671498617
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,16384,1024,0.08300533559587267
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,16384,1536,0.15647021929423013
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,16384,768,0.06535289022657606
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,16384,1536,0.1804035504659017
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,16384,1024,0.11841244167751735
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,16384,1024,0.135824892255995
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,16384,512,0.05166666706403097
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,16384,256,0.040904889504114784
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,16384,768,0.09492977460225423
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,16384,4096,0.38063645362854004
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,16384,512,0.09029510948393081
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,16384,512,0.07850222455130683
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,16384,128,0.029828445778952703
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,16384,256,0.0697831114133199
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,16384,256,0.0675813357035319
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,16384,128,0.055128001504474215
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,16384,128,0.06288355588912964
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,16384,32,0.027042667071024578
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,16384,64,0.06325244241290622
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,16384,32,0.0638657808303833
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,16384,2048,0.22268443637424043
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,16384,768,0.11132178041670059
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,16384,64,0.025286222497622173
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,12288,16384,0.8162950939602323
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,12288,16384,1.300472895304362
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,12288,51200,2.6451057857937283
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,12288,12288,0.5813537703620063
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,12288,65536,3.386058595445421
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,12288,16384,1.3661058213975694
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,12288,10240,0.5597350862291124
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,12288,12288,0.9603706995646158
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,12288,8192,0.3864275614420573
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,12288,10240,0.8002657890319824
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,12288,12288,1.0000719494289823
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,12288,7168,0.3426640033721924
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,12288,8192,0.6504293547736274
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,12288,10240,0.8395146793789334
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,12288,8192,0.6730737686157227
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,12288,51200,4.999372270372179
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,12288,7168,0.5560631222195095
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,12288,6144,0.35557066069708926
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,12288,7168,0.5938453144497341
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,12288,5120,0.2899991141425239
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,12288,6144,0.4709155294630263
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,12288,51200,4.373847961425781
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,12288,5120,0.41883643468221027
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,12288,6144,0.5300373501247829
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,12288,4096,0.2233333322736952
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,12288,3584,0.17191289530860054
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,12288,4096,0.3061342239379883
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,12288,5120,0.43168621593051487
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,12288,3072,0.14537866910298666
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,12288,65536,6.762725406222874
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,12288,4096,0.3562142319149441
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,12288,3584,0.26795021692911786
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,12288,2560,0.1223706669277615
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,12288,3584,0.3277217812008328
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,12288,3072,0.23069689008924696
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,12288,2048,0.10007111231486003
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,12288,3072,0.26537156105041504
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,12288,2560,0.21204533841874865
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,12288,65536,5.614068349202474
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,12288,1536,0.08561688661575317
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,12288,2048,0.1644586722056071
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,12288,1024,0.06211022535959879
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,12288,2048,0.19266222582923043
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,12288,1536,0.15105156103769937
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,12288,1536,0.12867466608683267
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,12288,768,0.059154669443766274
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,12288,1024,0.11466222339206272
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,12288,512,0.04504177636570401
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,12288,1024,0.10315466589397854
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,12288,768,0.0806551112069024
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,12288,768,0.09722755352656047
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,12288,256,0.033871110942628645
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,12288,512,0.07788444227642484
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,12288,512,0.06463199853897095
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,12288,128,0.030445333984163072
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,12288,64,0.02774311105410258
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,12288,32,0.029278222057554457
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,12288,256,0.05443466703097025
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,12288,256,0.06472355789608426
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,12288,128,0.0479911102188958
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,12288,128,0.05123555660247803
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,12288,64,0.05096711052788628
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,12288,32,0.05139644609557258
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,12288,2560,0.22792532708909777
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,10240,16384,0.7253653208414713
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,10240,51200,2.1576294369167752
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,10240,65536,2.745023939344618
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,10240,16384,1.206774181789822
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,10240,12288,0.5542391141255697
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,10240,12288,0.8450186517503527
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,10240,10240,0.47965865665011936
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,10240,16384,1.2371181911892362
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,10240,12288,0.9130356046888563
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,10240,8192,0.33796532948811847
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,10240,51200,4.332940419514974
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,10240,8192,0.5628213352627224
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,10240,7168,0.305947568681505
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,10240,10240,0.7887866761949328
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,10240,51200,3.9149157206217446
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,10240,8192,0.6297618018256294
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,10240,6144,0.252745787302653
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,10240,7168,0.4894560178120931
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,10240,5120,0.2317582236395942
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,10240,6144,0.4318488968743219
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,10240,7168,0.5735004213121202
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,10240,65536,5.695855034722222
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,10240,10240,0.7032364209493002
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,10240,6144,0.46938313378228086
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,10240,4096,0.1736888885498047
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,10240,3584,0.15872977839575872
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,10240,4096,0.2751733462015788
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,10240,5120,0.45713334613376194
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,10240,3072,0.14076799816555446
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,10240,3584,0.2376871109008789
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,10240,65536,5.104949527316623
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,10240,4096,0.3395964569515652
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,10240,3584,0.30122489399380153
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,10240,2560,0.10876711209615071
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,10240,2048,0.09418044487635295
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,10240,3072,0.20665866798824736
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,10240,1536,0.06772444645563762
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,10240,2560,0.17585955725775826
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,10240,2048,0.14795733822716609
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,10240,2048,0.1723466714223226
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,10240,2560,0.223183102077908
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,10240,768,0.04007377889421251
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,10240,1536,0.11488000551859538
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,10240,1024,0.11009155379401313
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,10240,1024,0.08716177940368652
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,10240,512,0.028508444627126057
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,10240,768,0.08854399787055121
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,10240,768,0.07119644350475736
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,10240,256,0.02193333374129401
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,10240,512,0.05762488974465264
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,10240,512,0.07328444719314575
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,10240,5120,0.3477928903367784
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,10240,128,0.019631110959582858
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,10240,256,0.04746311240726047
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,10240,256,0.055352889829211764
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,10240,64,0.01686311099264357
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,10240,32,0.01682222220632765
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,10240,128,0.04419733418358696
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,10240,128,0.04532533221774631
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,10240,64,0.043903999858432345
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,10240,32,0.043552001317342125
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,10240,3072,0.24694487783643934
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,10240,1024,0.049711998966005116
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,10240,1536,0.14108444584740534
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,8192,16384,0.6225235727098253
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,8192,16384,0.9870648913913302
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,8192,51200,1.954482608371311
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,8192,12288,0.49829689661661786
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,8192,65536,2.5165928734673395
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,8192,16384,1.1197919845581055
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,8192,10240,0.37737690077887637
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,8192,12288,0.7513226403130425
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,8192,8192,0.24002578523423937
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,8192,12288,0.8453431129455566
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,8192,10240,0.618359989590115
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,8192,7168,0.26613956027560765
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,8192,8192,0.49886221355862087
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,8192,51200,3.7449735005696616
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,8192,10240,0.7756409115261502
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,8192,6144,0.19956799348195395
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,8192,8192,0.5616738001505533
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,8192,7168,0.4717369079589844
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,8192,6144,0.3678773244222005
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,8192,5120,0.1942044496536255
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,8192,7168,0.4968115488688151
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,8192,4096,0.11991466416252984
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,8192,6144,0.45510313245985246
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,8192,65536,4.7700072394476996
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,8192,51200,3.5025831858317056
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,8192,4096,0.23772801293267143
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,8192,3584,0.11749511294894749
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,8192,5120,0.3584391011132135
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,8192,3072,0.11520266532897949
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,8192,4096,0.2991280025906033
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,8192,3584,0.2200026644600762
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,8192,2560,0.08119910955429077
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,8192,3584,0.25619199540879994
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,8192,3072,0.18767910533481172
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,8192,3072,0.22058222028944227
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,8192,2048,0.06981155607435438
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,8192,1536,0.05990578068627251
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,8192,2560,0.16174222363366023
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,8192,2560,0.1907893286810981
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,8192,65536,4.486005147298177
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,8192,2048,0.1288871102862888
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,8192,2048,0.15705955028533936
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,8192,768,0.0313297775056627
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,8192,1536,0.12915999359554714
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,8192,1024,0.09685333569844563
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,8192,1024,0.07686222261852689
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,8192,768,0.061807996696896024
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,8192,512,0.02664799988269806
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,8192,768,0.08102044132020739
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,8192,256,0.021336888273557026
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,8192,512,0.049920890066358775
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,8192,512,0.0651786658498976
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,8192,5120,0.3138764434390598
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,8192,128,0.016866667403115165
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,8192,256,0.04983555608325534
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,8192,256,0.039860443936453924
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,8192,64,0.014084445105658637
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,8192,32,0.015947555502255756
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,8192,128,0.040030221144358315
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,8192,128,0.036023110151290894
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,8192,64,0.03581155671013726
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,8192,32,0.03497511148452759
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,8192,1024,0.04032889008522034
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,8192,1536,0.10127288765377468
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,7168,16384,0.5197697745429145
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,7168,51200,1.6731475194295247
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,7168,65536,2.1164489322238498
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,7168,12288,0.41100443734063047
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,7168,16384,0.9417751100328234
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,7168,10240,0.3358951144748264
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,7168,16384,1.040071063571506
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,7168,12288,0.7437546518113879
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,7168,12288,0.8072897593180338
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,7168,8192,0.26475289132859975
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,7168,10240,0.6111324628194174
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,7168,51200,3.4131431579589844
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,7168,10240,0.6513537830776638
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,7168,7168,0.2388817734188504
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,7168,8192,0.455168883005778
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,7168,6144,0.20312799347771537
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,7168,7168,0.4080062177446153
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,7168,7168,0.4651893509758844
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,7168,6144,0.3421413368648953
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,7168,5120,0.1610764397515191
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,7168,65536,4.377301534016927
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,7168,4096,0.12442221906450059
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,7168,51200,3.2309750450981984
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,7168,6144,0.42730222807990176
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,7168,5120,0.2828257878621419
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,7168,3584,0.1141973336537679
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,7168,5120,0.3361839983198378
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,7168,4096,0.2291004392835829
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,7168,3072,0.09654400083753799
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,7168,3584,0.1931626664267646
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,7168,2560,0.08149511284298368
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,7168,3584,0.2363671196831597
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,7168,3072,0.16815466350979277
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,7168,2048,0.06808355781767103
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,7168,3072,0.20965154965718588
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,7168,2560,0.1450035572052002
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,7168,1536,0.05310488740603129
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,7168,8192,0.5338906712002224
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,7168,2048,0.1181288825141059
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,7168,1024,0.03484355409940084
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,7168,1536,0.09395644399854873
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,7168,1536,0.11927110619015163
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,7168,768,0.027067555321587458
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,7168,1024,0.09103822045856053
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,7168,1024,0.07022044393751356
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,7168,512,0.020103999310069613
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,7168,768,0.05671377976735433
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,7168,768,0.07643022139867146
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,7168,256,0.019332443674405415
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,7168,512,0.04490400022930569
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,7168,128,0.014038221703635322
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,7168,256,0.03535111082924737
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,7168,256,0.04782399866316053
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,7168,64,0.015171556009186639
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,7168,128,0.032531556155946516
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,7168,128,0.038049777348836265
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,7168,32,0.01577333278126187
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,7168,4096,0.28006309933132595
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,7168,64,0.03194400005870395
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,7168,32,0.03183822168244256
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,7168,65536,4.146606021457248
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,7168,2560,0.18298044469621447
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,7168,2048,0.14704533418019614
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,7168,512,0.061808890766567655
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,6144,16384,0.4654071066114638
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,6144,51200,1.4328933291965062
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,6144,16384,0.847541332244873
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,6144,65536,1.9675636291503906
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,6144,12288,0.35152623388502335
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,6144,12288,0.6418622334798177
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,6144,16384,0.9959199693467883
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,6144,10240,0.2979751163058811
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,6144,12288,0.7476648754543729
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,6144,8192,0.21771644221411812
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,6144,51200,3.049950281778971
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,6144,10240,0.5217510859171549
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,6144,7168,0.19740977552202013
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,6144,10240,0.6260017818874782
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,6144,8192,0.41962488492329914
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,6144,7168,0.36698489718967015
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,6144,65536,3.8706864251030813
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,6144,8192,0.5369235674540201
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,6144,51200,3.0812284681532116
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,6144,5120,0.13860978020562068
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,6144,6144,0.3164942264556885
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,6144,4096,0.10854933659235637
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,6144,6144,0.38638665941026473
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,6144,5120,0.26664890183342826
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,6144,3584,0.10354222191704644
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,6144,5120,0.3223324351840549
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,6144,4096,0.205457780096266
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,6144,3072,0.08678133620156182
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,6144,4096,0.2900497648451063
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,6144,3584,0.17881511317359078
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,6144,2560,0.0708035561773512
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,6144,3584,0.226548433303833
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,6144,3072,0.15429333845774332
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,6144,65536,3.951870388454861
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,6144,2048,0.05853866868548923
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,6144,3072,0.19784533977508545
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,6144,2560,0.13293688827090794
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,6144,2560,0.17400711112552217
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,6144,2048,0.10929510990778606
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,6144,2048,0.14351644780900744
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,6144,1024,0.031120889716678198
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,6144,1536,0.08693866597281562
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,6144,6144,0.1762871079974704
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,6144,1536,0.11378222041659886
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,6144,512,0.018054222067197163
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,6144,1024,0.06448177496592204
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,6144,768,0.07351199785868327
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,6144,768,0.051966223451826304
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,6144,7168,0.4552453358968099
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,6144,256,0.018751111295488145
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,6144,512,0.04042933384577433
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,6144,128,0.016490666402710807
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,6144,512,0.05906222263971964
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,6144,64,0.01516533394654592
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,6144,256,0.04451555675930447
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,6144,256,0.032279110617107816
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,6144,128,0.034627556800842285
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,6144,32,0.015576889117558798
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,6144,64,0.02944799926545885
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,6144,32,0.02897777822282579
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,6144,1536,0.04554933309555054
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,6144,768,0.023690667417314317
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,6144,1024,0.08824533224105835
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,6144,128,0.029701332251230877
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,5120,16384,0.3526337676578098
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,5120,51200,1.2056435479058158
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,5120,12288,0.3023911052280002
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,5120,16384,0.7746604283650717
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,5120,16384,0.9402542114257812
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,5120,12288,0.7079528702629937
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,5120,65536,1.3201991187201607
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,5120,10240,0.2389119995964898
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,5120,8192,0.1937075588438246
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,5120,12288,0.6926337877909342
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,5120,10240,0.5083653132120768
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,5120,51200,2.696480009290907
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,5120,7168,0.16208710935380724
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,5120,10240,0.5833377838134766
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,5120,65536,3.364976035224067
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,5120,8192,0.41995734638637966
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,5120,6144,0.13965422577328152
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,5120,8192,0.4707484245300293
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,5120,5120,0.116175995932685
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,5120,7168,0.3517377906375461
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,5120,7168,0.4159066677093506
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,5120,6144,0.291686216990153
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,5120,4096,0.08944088882870144
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,5120,5120,0.2409155633714464
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,5120,6144,0.3660106658935547
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,5120,3584,0.07812800010045369
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,5120,5120,0.30340443717108834
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,5120,51200,2.8376613193088107
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,5120,3072,0.06672710842556424
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,5120,4096,0.18750488758087158
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,5120,2560,0.055629332860310875
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,5120,3584,0.1629155609342787
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,5120,3584,0.21249422762129042
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,5120,3072,0.14215021663241917
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,5120,2048,0.045331554280387036
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,5120,3072,0.18348888556162515
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,5120,1536,0.03398044572936164
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,5120,2560,0.1198844379848904
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,5120,2560,0.15808267063564724
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,5120,1024,0.02456533412138621
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,5120,2048,0.10150577624638875
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,5120,2048,0.132259554333157
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,5120,1536,0.0794080032242669
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,5120,768,0.01997511088848114
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,5120,1536,0.10615022314919366
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,5120,512,0.015448888142903646
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,5120,1024,0.05847466654247708
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,5120,1024,0.0808275540669759
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,5120,256,0.012056888805495368
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,5120,768,0.06863022512859769
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,5120,768,0.04671555426385668
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,5120,128,0.011018666956159802
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,5120,512,0.037167112032572426
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,5120,256,0.02944177720281813
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,5120,256,0.041909333732393056
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,5120,64,0.009711110757456886
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,5120,128,0.03302222159173753
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,5120,128,0.026752889156341553
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,5120,32,0.009709333380063375
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,5120,64,0.02650755478276147
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,5120,32,0.026358221968015034
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,5120,4096,0.24073333210415312
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,5120,65536,3.6396908230251737
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,5120,512,0.055071999629338585
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,4096,51200,0.9711004892985026
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,4096,65536,1.3982284333970811
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,4096,16384,0.31389421886867946
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,4096,12288,0.24070223172505698
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,4096,16384,0.7099226845635308
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,4096,10240,0.19352711571587455
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,4096,12288,0.5305511156717936
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,4096,16384,0.9042124218410916
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,4096,8192,0.1607288916905721
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,4096,51200,2.3481725056966147
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,4096,12288,0.662027570936415
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,4096,10240,0.4360675546858046
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,4096,7168,0.13700711727142334
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,4096,10240,0.5593475765652126
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,4096,65536,3.071208953857422
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,4096,8192,0.35178399085998535
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,4096,6144,0.12046666940053304
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,4096,7168,0.3079955577850342
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,4096,5120,0.09917955266104804
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,4096,8192,0.4497937626308865
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,4096,4096,0.07947466770807902
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,4096,7168,0.39594756232367617
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,4096,6144,0.2658497757381863
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,4096,51200,2.708192825317383
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,4096,5120,0.21957066324022081
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,4096,6144,0.34291556146409774
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,4096,3584,0.07027377684911092
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,4096,5120,0.28509510887993705
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,4096,4096,0.17135911517673066
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,4096,4096,0.2284853458404541
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,4096,3584,0.14878755145602757
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,4096,2560,0.04741866721047295
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,4096,3584,0.200762669245402
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,4096,2048,0.03681244452794393
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,4096,3072,0.1751422219806247
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,4096,1536,0.028724445237053767
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,4096,65536,3.4585058424207897
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,4096,2560,0.14955377578735352
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,4096,2048,0.08914399809307522
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,4096,2048,0.12485510773128933
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,4096,1024,0.021891555852360193
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,4096,768,0.01702844434314304
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,4096,1536,0.07194666730033027
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,4096,1536,0.10091466373867458
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,4096,512,0.014144000079896716
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,4096,1024,0.051627556482950844
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,4096,1024,0.07709066735373603
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,4096,256,0.01057866629627016
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,4096,768,0.04270222120814853
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,4096,768,0.06473155816396077
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,4096,128,0.009179555707507664
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,4096,512,0.050718221399519176
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,4096,512,0.0326551099618276
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,4096,64,0.008625778059164682
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,4096,256,0.025793777571784124
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,4096,256,0.039460443788104586
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,4096,32,0.008661333057615492
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,4096,128,0.03189422355757819
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,4096,64,0.02366311185889774
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,4096,32,0.02335111134582096
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,4096,3072,0.05631999837027656
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,4096,3072,0.12802310784657797
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,4096,2560,0.10879288779364692
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,3584,16384,0.2818631066216363
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,3584,51200,0.8730666902330187
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,3584,65536,1.1097360187106662
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,4096,128,0.02411199940575494
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,3584,12288,0.22287911838955352
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,3584,16384,0.6637839741177028
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,3584,10240,0.167684449089898
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,3584,12288,0.49207019805908203
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,3584,12288,0.6652204195658366
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,3584,16384,0.9007173114352756
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,3584,8192,0.1381466653611925
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,3584,10240,0.4254124429490831
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,3584,51200,2.2364044189453125
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,3584,10240,0.5345350901285807
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,3584,7168,0.11984533733791775
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,3584,8192,0.33635555373297793
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,3584,6144,0.10004266765382554
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,3584,8192,0.43320533964369035
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,3584,65536,2.8311449686686196
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,3584,7168,0.2920648786756727
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,3584,5120,0.08551644616656834
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,3584,7168,0.3807324568430583
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,3584,6144,0.25172445509168834
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,3584,4096,0.06395555867089166
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,3584,6144,0.32878843943277997
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,3584,51200,2.584586673312717
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,3584,5120,0.27505066659715444
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,3584,3584,0.06025422281689114
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,3584,3072,0.048093332184685596
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,3584,4096,0.16273510456085205
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,3584,4096,0.21851821740468344
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,3584,3584,0.14112799697452122
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,3584,2560,0.04217155443297493
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,3584,3584,0.19258399804433188
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,3584,3072,0.12190755208333333
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,3584,2048,0.034056001239352755
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,3584,3072,0.1677022245195177
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,3584,65536,3.3067298465304904
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,3584,1536,0.02750844425625271
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,3584,2560,0.10339999861187404
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,3584,1024,0.020262221495310467
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,3584,2048,0.11994489034016927
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,3584,2048,0.08490133285522461
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,3584,768,0.015649777319696214
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,3584,1536,0.09711822536256577
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,3584,1024,0.04965066578653124
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,3584,1024,0.07394933038287692
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,3584,512,0.012395555774370829
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,3584,768,0.06152266926235623
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,3584,768,0.04020355476273431
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,3584,256,0.010874666273593903
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,3584,512,0.031665778822369046
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,3584,512,0.048504001564449735
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,3584,5120,0.20786489380730522
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,3584,128,0.009315555294354757
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,3584,256,0.024663999676704407
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,3584,256,0.03775644302368164
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,3584,64,0.008635555704434713
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,3584,32,0.008967999782827165
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,3584,128,0.022341334157519873
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,3584,128,0.03113422128889296
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,3584,64,0.022307554880777996
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,3584,32,0.02234399980968899
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,3584,2560,0.14345867104000515
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,3584,1536,0.06835822264353435
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,3072,51200,0.7694577640957303
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,3072,16384,0.2500053246815999
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,3072,65536,1.0082035064697266
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,3072,12288,0.18182222048441568
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,3072,16384,0.6179173257615831
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,3072,12288,0.5402364201015896
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,3072,10240,0.15423999892340765
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,3072,12288,0.6227031283908421
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,3072,16384,0.8441751268174914
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,3072,8192,0.12962844636705187
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,3072,10240,0.3945128917694092
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,3072,51200,2.025871912638346
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,3072,7168,0.10582311285866632
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,3072,10240,0.5127937528822157
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,3072,8192,0.3164817757076687
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,3072,6144,0.09444622198740642
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,3072,8192,0.413832876417372
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,3072,7168,0.276310231950548
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,3072,5120,0.07727466689215766
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,3072,65536,2.6092213524712458
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,3072,6144,0.2374666796790229
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,3072,7168,0.3658897876739502
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,3072,4096,0.06063999732335409
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,3072,6144,0.31586488087972003
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,3072,3584,0.05371910995907254
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,3072,51200,2.464600033230252
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,3072,5120,0.1966924402448866
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,3072,4096,0.15404444270663792
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,3072,5120,0.26182312435574
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,3072,3072,0.048102223210864596
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,3072,4096,0.20942755540211996
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,3072,2560,0.041681776444117226
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,3072,3584,0.1344266732533773
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,3072,2048,0.03373333480623033
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,3072,3584,0.1847804387410482
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,3072,3072,0.11608533064524333
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,3072,1536,0.02737422287464142
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,3072,2560,0.0982639988263448
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,3072,2560,0.13720533582899305
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,3072,1024,0.017673777209387887
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,3072,2048,0.08103822337256537
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,3072,2048,0.11484532886081272
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,3072,768,0.013984888792037964
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,3072,1536,0.06099288993411594
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,3072,1536,0.09264177746242946
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,3072,512,0.011525332927703857
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,3072,1024,0.045201778411865234
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,3072,1024,0.07095999850167169
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,3072,65536,3.1536907619900174
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,3072,256,0.009016888837019602
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,3072,768,0.05810044209162394
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,3072,512,0.04658044377962748
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,3072,128,0.00794577764140235
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,3072,256,0.03628622161017524
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,3072,256,0.023031110564867657
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,3072,64,0.007050666544172499
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,3072,128,0.029847999413808186
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,3072,32,0.0069226668112807805
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,3072,64,0.020463999774720933
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,3072,32,0.020640000700950623
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,3072,3072,0.16061777538723415
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,2560,65536,0.6660115453932021
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,3072,768,0.03769333495034112
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,3072,512,0.029142220815022785
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,2560,51200,0.5559573173522949
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,3072,128,0.020976000361972388
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,2560,16384,0.18057333098517525
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,2560,12288,0.12802933322058782
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,2560,12288,0.4398889011806912
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,2560,16384,0.5857671101888021
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,2560,10240,0.12154932816823323
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,2560,12288,0.5812017652723525
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,2560,16384,0.8004177941216363
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,2560,8192,0.09843555423948501
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,2560,10240,0.37129865752326113
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,2560,7168,0.08060089084837171
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,2560,10240,0.4873466491699219
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,2560,65536,2.416609870062934
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,2560,8192,0.3011111153496636
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,2560,6144,0.07015911075803968
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,2560,51200,1.8859812418619792
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,2560,8192,0.3954453203413222
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,2560,7168,0.26269422637091744
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,2560,5120,0.057736886872185596
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,2560,4096,0.04465333289570279
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,2560,6144,0.2255484528011746
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,2560,7168,0.34795112080044216
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,2560,3584,0.04207999838723076
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,2560,5120,0.18769421842363146
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,2560,6144,0.30152710278828937
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,2560,5120,0.25125598907470703
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,2560,3072,0.035016000270843506
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,2560,4096,0.14631733629438612
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,2560,4096,0.2005831135643853
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,2560,2560,0.028744889630211726
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,2560,3584,0.127128005027771
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,2560,3584,0.175744891166687
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,2560,2048,0.02533955540921953
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,2560,3072,0.11009511020448472
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,2560,3072,0.1532977819442749
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,2560,65536,3.000787523057726
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,2560,1536,0.019828443725903828
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,2560,2560,0.09250577953126694
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,2560,2560,0.13152266873253718
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,2560,1024,0.014750222365061441
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,2560,51200,2.3480105929904513
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,2560,768,0.012098666694429187
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,2560,2048,0.07569155428144667
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,2560,2048,0.1096995539135403
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,2560,512,0.009547555612193214
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,2560,1536,0.0576853354771932
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,2560,1024,0.06763822502560086
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,2560,1024,0.043473776843812734
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,2560,256,0.007323555648326874
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,2560,768,0.05669155385759142
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,2560,768,0.03559199968973795
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,2560,128,0.007075555622577667
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,2560,512,0.027463111612531874
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,2560,512,0.045976890458001025
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,2560,64,0.006281777802440856
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,2560,32,0.006284444282452266
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,2560,256,0.03539822167820401
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,2560,256,0.021873777111371357
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,2560,128,0.029361777835422095
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,2560,128,0.019606222709019978
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,2560,64,0.01920000049802992
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,2560,32,0.019160888261265226
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,2048,16384,0.16067555215623644
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,2048,51200,0.49798223707411027
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,2048,65536,0.6128871175977919
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,2048,12288,0.12835200627644858
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,2048,16384,0.5517182350158691
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,2560,1536,0.08837333652708267
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,2048,10240,0.10559022426605225
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,2048,12288,0.44515201780531144
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,2048,16384,0.7843342357211642
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,2048,8192,0.084279113345676
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,2048,12288,0.5766942236158583
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,2048,10240,0.3511813216739231
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,2048,7168,0.07453866799672444
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,2048,51200,1.7442382176717122
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,2048,10240,0.49053865008884007
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,2048,8192,0.28443288803100586
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,2048,6144,0.06356533368428548
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,2048,8192,0.3923964500427246
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,2048,7168,0.24870488378736708
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,2048,5120,0.052501334084404834
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,2048,65536,2.2246676550971136
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,2048,7168,0.3459635575612386
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,2048,4096,0.042938666211234204
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,2048,6144,0.29920978016323513
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,2048,5120,0.17672177155812582
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,2048,3584,0.039797332551744245
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,2048,51200,2.330990261501736
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,2048,5120,0.24813956684536406
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,2048,4096,0.13809155093299016
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,2048,3072,0.03440533412827386
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,2048,3584,0.12003644307454427
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,2048,3584,0.17394844690958658
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,2048,3072,0.10367821984820896
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,2048,2560,0.029537777105967205
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,2048,3072,0.15161866611904568
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,2048,2048,0.024479111035664875
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,2048,2560,0.08722400003009373
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,2048,2560,0.13038221995035806
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,2048,2048,0.07134133577346802
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,2048,65536,2.972977744208442
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,2048,2048,0.10868977838092381
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,2048,1536,0.019865777757432725
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,2048,1024,0.0144195556640625
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,2048,768,0.01180266671710544
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,2048,1536,0.0865280032157898
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,2048,1536,0.055832001898023814
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,2048,1024,0.039770666095945574
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,2048,512,0.00997688869635264
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,2048,768,0.032935112714767456
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,2048,6144,0.21375644207000732
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,2048,768,0.055326223373413086
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,2048,256,0.007311999797821045
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,2048,512,0.02570933269129859
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,2048,128,0.006632888896597757
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,2048,256,0.01994044416480594
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,2048,256,0.03428355521625943
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,2048,128,0.02809244394302368
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,2048,128,0.018236445056067575
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,2048,32,0.007634667058785756
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,2048,4096,0.19742133882310656
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,2048,64,0.017868444323539734
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,2048,32,0.017698667115635343
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,1536,65536,0.455809752146403
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,1536,51200,0.3807982338799371
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,2048,1024,0.06554489003287421
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,1536,16384,0.12705777751074895
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,2048,512,0.04353244437111748
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,2048,64,0.007134222322040134
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,1536,12288,0.09098400010002984
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,1536,16384,0.5188417964511448
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,1536,10240,0.07776888873842028
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,1536,12288,0.3928062121073405
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,1536,16384,0.7270613246493869
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,1536,12288,0.5500782330830892
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,1536,8192,0.06518933508131239
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,1536,10240,0.32970576816134983
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,1536,7168,0.051544000705083214
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,1536,65536,2.068742116292318
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,1536,51200,1.618917359246148
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,1536,10240,0.46205510033501523
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,1536,8192,0.26660799980163574
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,1536,6144,0.04531022244029575
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,1536,5120,0.03936977850066291
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,1536,8192,0.3746595647599962
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,1536,7168,0.2339848942226834
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,1536,4096,0.029256890217463177
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,1536,7168,0.329802672068278
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,1536,6144,0.285187562306722
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,1536,5120,0.1661048862669203
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,1536,3584,0.026758222116364375
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,1536,5120,0.23715734481811523
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,1536,4096,0.12973511219024658
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,1536,3072,0.02307644486427307
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,1536,4096,0.1882151100370619
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,1536,3584,0.11238043838077122
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,1536,51200,2.214252471923828
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,1536,3584,0.16537422604031032
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,1536,2560,0.020374221934212577
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,1536,2048,0.016879111528396606
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,1536,65536,2.8256053924560547
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,1536,3072,0.09654488828447129
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,1536,1536,0.013594666288958656
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,1536,2560,0.08274044593175252
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,1536,2560,0.12418666150834824
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,1536,2048,0.06782933076222737
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,1536,1024,0.010334221853150262
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,1536,2048,0.10378666718800862
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,1536,768,0.008810666700204214
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,1536,1536,0.05202844407823351
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,1536,1536,0.08391200171576606
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,1536,512,0.006983111302057902
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,1536,1024,0.062069336573282875
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,1536,1024,0.036678221490648054
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,1536,768,0.05237155490451389
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,1536,256,0.0058906666106647914
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,1536,128,0.005604444278611078
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,1536,512,0.042120890484915845
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,1536,512,0.024421332610978022
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,1536,256,0.018820444742838543
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,1536,64,0.004881777697139316
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,1536,128,0.016875555117925007
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,1536,32,0.005199111170238919
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,1536,6144,0.20118133227030435
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,1536,64,0.01649599936273363
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,1536,32,0.016318221886952717
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,1024,65536,0.3428186575571696
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,1536,3072,0.14447111553615993
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,1024,51200,0.27856000264485675
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,1536,768,0.03071911136309306
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,1024,16384,0.08773422241210938
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,1536,256,0.033538666036393903
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,1536,128,0.02708622150950962
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,1024,12288,0.06154221958584256
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,1024,16384,0.4884471363491482
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,1024,12288,0.36927111943562824
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,1024,10240,0.052520000272327
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,1024,16384,0.6883804533216688
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,1024,65536,1.9268692864312067
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,1024,51200,1.5060417387220595
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,1024,8192,0.04162755608558655
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,1024,12288,0.522508462270101
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,1024,10240,0.31000889672173393
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,1024,7168,0.03889333208401998
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,1024,10240,0.4382453229692247
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,1024,8192,0.25020000669691295
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,1024,6144,0.030759112702475652
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,1024,7168,0.21985156006283232
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,1024,8192,0.35557066069708926
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,1024,5120,0.026504889130592346
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,1024,7168,0.3132675488789876
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,1024,6144,0.18863644864824083
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,1024,6144,0.2716906600528293
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,1024,5120,0.15607466962602404
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,1024,3584,0.019945777124828763
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,1024,65536,2.677969826592339
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,1024,5120,0.22443911764356825
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,1024,4096,0.1225093338224623
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,1024,51200,2.103515625
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,1024,3072,0.017549332645204332
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,1024,4096,0.17954844898647734
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,1024,2560,0.015390222271283468
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,1024,3584,0.10523821910222371
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,1024,2048,0.013439999686347114
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,1024,3584,0.15763200653923884
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,1024,3072,0.09052977959314983
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,1024,3072,0.13706044356028238
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,1024,1536,0.011413333316644033
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,1024,2560,0.11797689066992866
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,1024,1024,0.009306666751702627
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,1024,2048,0.06305955515967475
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,1024,2048,0.09866044256422256
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,1024,768,0.00795911086930169
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,1024,1536,0.07936533292134602
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,1024,1536,0.047720889250437416
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,1024,512,0.006597333484225803
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,1024,1024,0.05895377529991997
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,1024,1024,0.033943110042148165
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,1024,256,0.005579555614127054
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,1024,768,0.05017688870429993
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,1024,768,0.028492444091373022
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,1024,128,0.004549333204825719
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,1024,512,0.022682666778564453
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,1024,512,0.040377779139412776
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,1024,64,0.004549333204825719
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,1024,256,0.031501332918802895
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,1024,256,0.01717333330048455
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,1024,32,0.006256000035338932
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,1024,128,0.015455999308162265
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,1024,128,0.025798221429189045
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,1024,64,0.014862222803963555
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,1024,32,0.014682667122946845
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,1024,4096,0.022416000564893086
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,768,51200,0.19386755095587838
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,768,65536,0.2613226572672526
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,768,16384,0.0673253337542216
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,768,12288,0.05451822280883789
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,1024,2560,0.07719822062386407
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,768,16384,0.4803742302788629
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,768,12288,0.3549484411875407
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,768,10240,0.040123555395338274
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,768,16384,0.6881484455532498
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,768,8192,0.034310221672058105
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,768,10240,0.29773155848185223
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,768,12288,0.5193893114725748
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,768,10240,0.4371688895755344
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,768,7168,0.028412444723976985
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,768,8192,0.2407440079583062
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,768,6144,0.023990222149425085
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,768,51200,1.4412106408013239
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,768,8192,0.3534088929494222
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,768,7168,0.21126043796539307
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,768,5120,0.020918221937285528
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,768,6144,0.18166400326622856
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,768,65536,1.8440479702419703
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,768,4096,0.016827555166350473
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,768,6144,0.26954134305318195
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,768,5120,0.14972533120049372
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,768,3584,0.015483554866578845
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,768,4096,0.11755200227101643
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,768,5120,0.2234106593661838
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,768,4096,0.17852355374230278
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,768,3072,0.01387644476360745
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,768,51200,2.092898686726888
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,768,3584,0.10072088903850979
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,768,2560,0.012091555529170565
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,768,3584,0.1572293308046129
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,768,3072,0.08642399973339504
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,768,3072,0.13685333728790283
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,768,2048,0.010671999719407825
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,768,1536,0.009029332962301042
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,768,2560,0.07329244746102227
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,768,2048,0.059531556235419385
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,768,2048,0.09813866350385879
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,768,1024,0.007443555527263218
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,768,65536,2.6715350680881076
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,768,1536,0.0783440007103814
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,768,768,0.006607999818192587
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,768,1024,0.0588408907254537
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,768,512,0.005593777944644292
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,768,768,0.04948800139957004
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,768,768,0.027422222826215956
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,768,256,0.00453955555955569
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,768,512,0.02199911077817281
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,768,512,0.040159109565946795
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,768,128,0.004226666771703296
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,768,256,0.016662221815851
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,768,256,0.03133422136306763
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,768,64,0.0038524443904558816
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,768,128,0.02574577762020959
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,768,128,0.014478221535682678
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,768,32,0.0038480001191298165
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,768,64,0.014130666851997375
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,768,32,0.014095111025704278
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,512,65536,0.18348356088002524
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,768,2560,0.11731199423472087
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,512,51200,0.15830755233764648
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,768,1536,0.04543911086188423
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,512,16384,0.04764266808827718
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,768,1024,0.03311466508441501
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,768,7168,0.3117706775665283
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,512,12288,0.037754668129815
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,512,16384,0.4571173455980089
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,512,10240,0.030244443151685927
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,512,12288,0.3456879986657037
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,512,16384,0.648347536722819
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,512,8192,0.024572443630960252
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,512,10240,0.29042667812771267
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,512,12288,0.4928257730272081
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,512,7168,0.021704889006084863
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,512,51200,1.4020782046847875
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,512,8192,0.2348933219909668
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,512,10240,0.4133457872602675
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,512,6144,0.019321777754359774
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,512,65536,1.7918319702148438
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,512,5120,0.016700444949997794
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,512,8192,0.3349626594119602
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,512,7168,0.20630755689409044
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,512,4096,0.013927110367351107
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,512,6144,0.17746844556596544
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,512,7168,0.2959546777937147
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,512,6144,0.2555866771274143
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,512,5120,0.14636266231536865
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,512,3584,0.012396444049146442
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,512,5120,0.21228088272942436
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,512,4096,0.11373778184254964
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,512,4096,0.16885156101650664
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,512,51200,1.9769102732340496
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,512,3584,0.09772177537282307
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,512,2560,0.010107555323176915
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,512,3584,0.1482551097869873
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,512,2048,0.008894222478071848
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,512,3072,0.08388621939553155
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,512,3072,0.1294800043106079
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,512,1536,0.007654222349325816
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,512,2560,0.07101333141326904
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,512,2560,0.11097511317994858
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,512,2048,0.09252355496088664
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,512,2048,0.05735377470652262
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,512,1024,0.006634666687912411
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,512,768,0.005949333310127258
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,512,1536,0.07267110877566867
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,512,1536,0.04356000158521864
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,512,512,0.005203555441564984
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,512,1024,0.05572799841562907
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,512,1024,0.03164622187614441
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,512,768,0.026434666580624048
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,512,256,0.004403555558787452
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,512,768,0.047200000948376127
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,512,128,0.0038355555799272326
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,512,512,0.020939555433061387
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,512,512,0.038351999388800725
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,512,64,0.0034959999223550162
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,512,256,0.02994489007525974
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,512,256,0.016187555260128446
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,512,32,0.003843555433882607
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,512,128,0.02467022173934513
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,512,128,0.013759999639458127
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,512,64,0.01347733371787601
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,256,65536,0.11290933026207818
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,512,32,0.013443555268976422
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,256,51200,0.08693599700927734
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,256,16384,0.03502666619088914
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,512,3072,0.011392888923486074
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,256,16384,0.43868356280856663
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,256,12288,0.02549155553181966
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,256,16384,0.6457360055711534
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,256,12288,0.33178665902879506
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,256,10240,0.020747555626763236
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,256,51200,1.3393706215752497
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,256,12288,0.489731576707628
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,256,10240,0.2784586747487386
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,256,65536,1.7163040373060439
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,256,7168,0.014832889040311178
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,512,65536,2.52727296617296
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,256,8192,0.22472800148857963
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,256,6144,0.013645333548386892
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,256,51200,1.9629156324598525
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,256,8192,0.33305244975619847
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,256,5120,0.012161778079138862
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,256,7168,0.19788977834913465
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,256,7168,0.2935724523332384
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,256,6144,0.169685337278578
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,256,4096,0.010262221925788457
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,256,5120,0.14038756158616808
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,256,6144,0.25407645437452525
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,256,3584,0.009392889009581672
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,256,5120,0.21073955959743926
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,256,3072,0.008641777767075432
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,256,4096,0.10891022284825642
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,256,4096,0.16791910595364043
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,256,2560,0.007609777980380588
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,256,3584,0.09338044457965428
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,256,3584,0.1472124391131931
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,256,3072,0.07976355817582872
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,256,3072,0.128711117638482
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,256,8192,0.01720888912677765
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,256,2560,0.06757955418692695
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,256,2560,0.10987733470069037
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,256,1536,0.005910222315125995
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,256,1024,0.005102222164471944
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,256,2048,0.054541332854164966
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,256,2048,0.09181066354115804
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,256,768,0.004575110971927643
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,256,1536,0.07400888866848417
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,256,1536,0.040248887406455144
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,256,10240,0.41100888782077366
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,256,1024,0.03018222252527873
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,256,512,0.004217777815130022
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,256,1024,0.05475199884838528
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,256,256,0.003914666672547658
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,256,768,0.025408888856569927
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,256,768,0.04664177695910136
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,256,512,0.02032711108525594
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,256,128,0.0038417776425679526
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,256,64,0.0035146665241983202
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,256,256,0.02948533495267232
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,256,32,0.0037786666717794207
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,256,128,0.013431111143694984
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,256,128,0.024479111035664875
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,256,64,0.012748444245921241
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,128,65536,0.08526044421725804
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,256,32,0.012735111018021902
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,256,65536,2.505562676323785
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,128,51200,0.06855377886030409
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,128,16384,0.027912888262006972
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,256,2048,0.0069102222720781965
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,128,16384,0.4275386598375108
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,128,12288,0.017228444417317707
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,256,512,0.037535998556349016
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,256,256,0.015246222416559855
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,128,10240,0.015512888630231222
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,128,16384,0.643430233001709
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,128,12288,0.3236044512854682
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,128,8192,0.013346666263209449
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,128,51200,1.3087760077582467
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,128,10240,0.27204444673326283
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,128,7168,0.011848889291286469
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,128,65536,1.6718471315171983
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,128,8192,0.21948711077372232
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,128,6144,0.01072533345884747
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,128,8192,0.33208976851569283
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,128,7168,0.19316444132063124
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,128,5120,0.009374221993817223
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,128,6144,0.16556533177693686
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,128,7168,0.2925848960876465
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,128,4096,0.007962666451931
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,128,5120,0.13658844100104436
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,128,5120,0.21044445037841797
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,128,4096,0.10630044672224258
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,128,3584,0.0075457774930530125
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,128,4096,0.16697777642144096
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,128,65536,2.502082612779405
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,128,3072,0.006607999818192587
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,128,3584,0.09083288908004761
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,128,3584,0.14649777942233616
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,128,2560,0.005919111271699269
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,128,3072,0.07779288954204984
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,128,3072,0.1276693344116211
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,128,12288,0.48854223887125653
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,128,2048,0.005558222118351195
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,128,2560,0.06566399998135038
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,128,10240,0.410262213812934
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,128,2560,0.1099662250942654
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,128,2048,0.09127822187211777
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,128,2048,0.05271910958819919
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,128,1024,0.004295999805132548
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,128,1536,0.07238222493065728
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,128,768,0.0038808890514903595
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,128,1024,0.029232889413833618
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,128,1024,0.05453422334459093
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,128,512,0.00351555562681622
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,128,51200,1.9568409389919703
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,128,768,0.024780443973011438
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,128,256,0.0032319999817344877
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,128,768,0.04620000057750278
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,128,6144,0.2537715435028076
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,128,128,0.003137777869900068
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,128,256,0.02885599931081136
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,128,256,0.014818666709793938
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,128,64,0.002826666666401757
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,128,128,0.012725333372751871
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,128,32,0.0028773333049482773
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,128,64,0.0124195557501581
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,128,32,0.012087999946541257
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,64,65536,0.07833244403203328
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,64,51200,0.06251466936535306
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,128,1536,0.004883555488453971
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,64,16384,0.025840888420740765
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,128,1536,0.03867822223239475
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,64,12288,0.013065777719020844
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,64,10240,0.013426666458447775
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,64,16384,0.4272293249766032
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,128,512,0.019885333047972787
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,64,12288,0.32349689801534015
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,64,7168,0.011325333681371478
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,64,10240,0.2719048923916287
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,64,8192,0.21892800596025255
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,64,6144,0.01034400032626258
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,64,5120,0.008981333010726506
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,64,7168,0.19266666306389701
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,64,4096,0.00794222205877304
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,64,6144,0.16533511214786106
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,64,51200,1.307379510667589
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,64,5120,0.1366915570365058
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,64,3584,0.007259555160999298
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,64,4096,0.10560355583826701
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,64,2560,0.006007110906971826
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,64,65536,1.672855059305827
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,64,3584,0.09050933519999187
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,64,3072,0.07739022043016222
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,64,2048,0.005223111146026188
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,64,1536,0.004866666677925321
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,64,2560,0.0656577746073405
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,64,1024,0.0041991112132867174
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,64,768,0.0038480001191298165
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,64,1536,0.040404445595211454
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,64,512,0.003528888854715559
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,64,1024,0.029135998752382066
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,128,512,0.037696888049443565
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,64,256,0.003195555466744635
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,64,768,0.02455733385350969
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,64,8192,0.012724444270133972
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,64,128,0.003160888950030009
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,64,64,0.0028284444577164124
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,64,32,0.002809777855873108
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,64,512,0.019865777757432725
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,64,256,0.01484266585773892
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,64,128,0.012375999655988483
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,64,64,0.012089778151777057
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,32,65536,0.07588533560434978
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,64,32,0.012086222569147745
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,32,16384,0.024724443753560383
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,32,51200,0.06054044432110257
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,32,12288,0.01221777747074763
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,32,10240,0.011018666956159802
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,64,3072,0.006583999842405319
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,32,12288,0.32320888837178546
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,32,8192,0.009686222506894005
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,32,10240,0.2715182304382324
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,32,16384,0.4269244405958388
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,32,7168,0.009876444107956356
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,32,6144,0.008737777670224508
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,32,5120,0.011253332926167382
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,32,8192,0.21891378031836617
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,32,7168,0.19248799482981363
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,32,6144,0.16549155447218153
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,32,4096,0.009653333160612319
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,64,2048,0.05255822340647379
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,32,3584,0.008678221868144141
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,32,5120,0.1364524496926202
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,32,2560,0.007252444823582967
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,32,4096,0.10552533467610677
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,32,3072,0.0778906676504347
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,32,2048,0.005214222189452913
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,32,1536,0.004556444370084339
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,32,2560,0.06595910920037164
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,32,1024,0.0041893331540955436
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,32,51200,1.309167120191786
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,32,2048,0.052904887331856616
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,32,1536,0.03891111082500882
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,32,768,0.0038373333712418876
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,32,512,0.003548444559176763
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,32,768,0.024705777565638225
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,32,65536,1.6719670825534398
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,32,512,0.01957155598534478
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,32,256,0.0031395554542541504
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,32,128,0.00286666676402092
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,32,64,0.0028320000403457214
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,32,256,0.014800889624489678
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,32,32,0.002846222163902389
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,32,64,0.011756444142924415
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,32,32,0.012058667010731168
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3584,32,3072,0.007981333467695449
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,32,3584,0.09062844514846802
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,32,1024,0.02940000096956889
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3584,32,128,0.0124177775449223
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,65536,12288,3.0566257900661893
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,65536,16384,4.274648878309462
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,65536,12288,3.6424844529893665
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,65536,10240,2.998678207397461
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,65536,16384,5.151394738091363
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,65536,8192,2.5071849822998047
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,65536,10240,2.9769102732340493
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,65536,8192,2.3370916578504777
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,65536,7168,1.9476356506347656
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,65536,7168,2.0101040734185114
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,65536,5120,1.3810017903645833
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,65536,6144,1.7527155346340602
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,65536,4096,1.0541004604763455
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,65536,6144,1.6927404403686523
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,65536,5120,1.4161333507961695
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,65536,3072,0.7578933503892687
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,65536,3584,0.9599901835123698
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,65536,3584,1.0204470952351887
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,65536,4096,1.1390150917900932
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,65536,3072,0.8434844546847873
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,65536,2560,0.6862008836534289
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,65536,1536,0.4145670996771918
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,65536,2048,0.5627519819471571
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,65536,2048,0.5830888748168945
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,65536,2560,0.7337404357062446
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,65536,1024,0.2952471044328478
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,65536,768,0.21322755018870035
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,65536,1536,0.5081297556559244
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,65536,512,0.1829519934124417
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,65536,1024,0.40600000487433535
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,65536,768,0.276309331258138
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,65536,256,0.133788439962599
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,65536,128,0.1080897781583998
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,65536,64,0.0785013304816352
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,65536,512,0.24068265491061738
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,65536,256,0.2225173314412435
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,65536,128,0.19547643926408556
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,65536,64,0.20037421915266249
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,65536,32,0.20654933982425264
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,65536,32,0.0822133355670505
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,65536,51200,13.071705288357206
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,51200,16384,3.154520882500542
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,51200,16384,4.041026645236545
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3584,128,128,0.023247111174795363
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,51200,12288,2.4763075510660806
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,65536,51200,20.100267198350696
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,51200,12288,2.8786676194932728
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,51200,10240,2.377679189046224
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,51200,51200,9.959983825683594
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,51200,10240,2.266842736138238
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,51200,8192,1.615428394741482
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,51200,8192,1.8919857872856989
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,51200,7168,1.4139715830485027
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,51200,6144,1.2700604332817924
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,51200,6144,1.3515653610229492
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,51200,7168,1.610664897494846
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,51200,5120,1.16447205013699
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,51200,4096,0.9551031324598523
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,51200,5120,1.1412311130099826
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,51200,3584,0.7094782193501791
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,51200,65536,12.935956319173178
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,51200,3072,0.7166630956861707
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,51200,4096,0.8874888949924045
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,51200,3072,0.6744871139526367
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,51200,3584,0.9617360432942709
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,51200,2560,0.5636026594373915
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,51200,1536,0.29903022448221844
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,51200,2048,0.45299376381768125
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,51200,1536,0.37743910153706867
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,51200,1024,0.2606168852912055
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,51200,768,0.18745688597361246
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,51200,512,0.155276444223192
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,51200,1024,0.28267023298475474
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,51200,2560,0.5905920134650336
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,51200,768,0.22297422091166177
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,51200,256,0.12675110499064127
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,51200,512,0.2125991053051419
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,51200,128,0.07589866717656453
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,51200,64,0.0741644435458713
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,51200,32,0.06707377566231622
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,51200,256,0.16634666919708252
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,51200,128,0.1566186613506741
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,51200,64,0.16369777255588108
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,51200,32,0.17968089050716826
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,51200,2048,0.4685520066155328
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,16384,16384,1.0016203986273873
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,16384,12288,0.8309049076504178
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,51200,51200,17.218065049913196
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,16384,16384,1.520409795973036
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,16384,51200,3.5524453057183156
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,16384,10240,0.7876044379340278
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,16384,12288,1.1642577913072374
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,16384,65536,4.356152004665799
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,16384,8192,0.6401395797729492
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,16384,10240,0.9067991044786242
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,16384,7168,0.49640798568725586
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,16384,6144,0.5464115672641331
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,16384,8192,0.9475733439127604
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,16384,6144,0.5343066851298014
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,16384,5120,0.363555563820733
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,16384,7168,0.6521173583136665
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,16384,4096,0.2982746760050456
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,16384,3584,0.28918221261766225
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,16384,3072,0.2053635517756144
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,16384,4096,0.34978400336371523
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,16384,5120,0.487594657474094
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,16384,3584,0.3131173451741536
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,16384,2560,0.18884978029463026
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,16384,2048,0.14155022303263345
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,16384,1536,0.12047378222147624
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,16384,3072,0.34567732281155056
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,16384,2048,0.18669244978162977
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,16384,1024,0.0859031081199646
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,16384,768,0.059552000628577344
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,16384,1536,0.15290666951073542
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,16384,512,0.051106668180889554
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,16384,256,0.03347200155258179
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,16384,1024,0.1437013281716241
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,16384,51200,6.1952667236328125
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,16384,128,0.03013066781891717
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,16384,64,0.02604088849491543
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,16384,256,0.06423022349675496
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,16384,768,0.10087733136283027
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,51200,65536,20.835600111219616
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,16384,32,0.025455110602908667
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,16384,128,0.06351288821962145
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,16384,64,0.06126755475997925
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,16384,32,0.06356088982688056
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,16384,2560,0.22734043333265516
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,12288,16384,0.776584890153673
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,16384,65536,7.734850565592448
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,16384,512,0.0765262246131897
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,12288,12288,0.6115244229634603
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,12288,10240,0.4670995606316461
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,12288,16384,1.2152178022596571
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,12288,12288,0.9204924901326498
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,12288,8192,0.396179543601142
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,12288,7168,0.3613475428687201
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,12288,10240,0.8028586705525717
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,12288,51200,2.5250559912787542
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,12288,8192,0.5865137841966417
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,12288,7168,0.5689679781595866
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,12288,6144,0.30416978730095756
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,12288,5120,0.2787706587049696
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,12288,4096,0.1934960020913018
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,12288,6144,0.4459688928392198
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,12288,5120,0.3645431200663249
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,12288,3584,0.20320799615648058
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,12288,65536,3.1875777774386935
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,12288,3072,0.15595822864108616
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,12288,4096,0.3382897906833225
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,12288,2560,0.14123733838399252
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,12288,2048,0.10751377873950535
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,12288,3584,0.28358133633931476
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,12288,3072,0.2174746725294325
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,12288,1536,0.09146310885747273
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,12288,1024,0.059007108211517334
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,12288,768,0.0583911140759786
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,12288,2560,0.23644622166951498
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,12288,512,0.043423109584384494
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,12288,1536,0.12195377879672581
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,12288,1024,0.0917288859685262
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,12288,256,0.03331022130118476
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,12288,768,0.07652799950705634
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,12288,128,0.020966221888860066
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,12288,64,0.018170666363504197
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,12288,32,0.018392889036072623
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,12288,128,0.05708089139726427
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,12288,512,0.06320177846484713
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,12288,64,0.04807466599676344
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,12288,32,0.04925600025388929
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,12288,2048,0.16532088650597468
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,12288,51200,4.850449879964192
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,12288,256,0.05742400222354465
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,10240,16384,0.6274888780381944
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,10240,12288,0.4775724411010742
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,10240,51200,2.0388399759928384
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,12288,65536,6.208179473876953
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,10240,16384,1.104615953233507
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,10240,10240,0.444992913140191
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,10240,8192,0.3467235565185547
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,10240,12288,0.869676431020101
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,10240,7168,0.3165253268347846
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,10240,65536,2.669609705607096
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,10240,10240,0.678542243109809
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,10240,8192,0.5250417921278212
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,10240,6144,0.290446228451199
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,10240,5120,0.21094577842288545
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,10240,7168,0.5234870910644531
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,10240,4096,0.19010844495561388
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,10240,6144,0.4656666649712457
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,10240,5120,0.32433422406514484
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,10240,3584,0.15429066287146673
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,10240,3072,0.12518310546875
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,10240,2560,0.106949335998959
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,10240,4096,0.2619413269890679
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,10240,3584,0.2640542189280192
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,10240,2048,0.09524444739023845
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,10240,1536,0.0695564415719774
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,10240,3072,0.19390043947431776
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,10240,2560,0.16928444968329537
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,10240,1024,0.04625599914126926
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,10240,768,0.038542220989863075
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,10240,2048,0.13782310485839844
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,10240,512,0.027053332991070215
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,10240,1536,0.11963466803232829
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,10240,1024,0.0816826687918769
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,10240,256,0.021531555387708876
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,10240,768,0.06860799921883477
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,10240,128,0.018920888503392536
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,10240,64,0.016157334049542744
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,10240,512,0.05551822317971123
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,10240,32,0.016168889072206285
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,10240,256,0.04739288820160759
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,10240,128,0.04105955693456862
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,10240,64,0.04110399881998698
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,10240,32,0.04072177741262648
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,10240,51200,4.207575056287977
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,8192,16384,0.5121439827813042
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,10240,65536,5.235284593370226
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,8192,12288,0.4183608955807156
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,8192,16384,0.9452666176689996
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,8192,10240,0.3634346591101752
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,8192,8192,0.29817154672410756
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,8192,51200,1.618035528394911
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,8192,10240,0.5738311343722874
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,8192,7168,0.27256443765428334
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,8192,65536,2.1457608540852866
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,8192,8192,0.534124427371555
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,8192,6144,0.23010667165120444
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,8192,7168,0.42341332965426975
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,8192,5120,0.1856142282485962
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,8192,4096,0.14133955372704401
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,8192,6144,0.4658186700608995
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,8192,3584,0.13229689333173963
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,8192,5120,0.29270844989352757
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,8192,4096,0.22654578420850965
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,8192,3072,0.13057422637939453
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,8192,2560,0.08719733026292588
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,8192,3584,0.2405946784549289
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,8192,2048,0.09100355704625447
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,8192,3072,0.19678933090633818
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,8192,1536,0.06370844443639119
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,8192,2560,0.1461306677924262
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,8192,1024,0.04390844371583727
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,8192,2048,0.1207617786195543
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,8192,512,0.023874666955735948
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,8192,1536,0.0985528892940945
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,8192,1024,0.0800044470363193
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,8192,256,0.018793778287039865
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,8192,768,0.060884442594316274
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,8192,128,0.015577778220176697
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,8192,12288,0.7033413251241049
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,8192,512,0.047120889027913414
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,8192,64,0.013343111508422427
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,8192,256,0.04145333170890808
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,8192,32,0.012834666503800286
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,8192,128,0.035749332772360906
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,8192,64,0.03371644351217482
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,8192,32,0.03395377927356296
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,8192,51200,3.5501653883192272
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,7168,16384,0.4606871075100369
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,8192,768,0.032630221711264715
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,7168,12288,0.36765866809421116
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,8192,65536,4.341756608751085
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,7168,16384,0.8746213383144803
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,7168,10240,0.3262133333418104
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,7168,8192,0.23828887939453125
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,7168,51200,1.5300959481133356
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,7168,12288,0.6398337682088217
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,7168,10240,0.5423955387539333
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,7168,7168,0.20843999915652803
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,7168,65536,1.8913938734266493
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,7168,6144,0.17235822147793242
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,7168,5120,0.16239110628763834
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,7168,8192,0.469321780734592
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,7168,4096,0.11840532885657416
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,7168,7168,0.40530843204922146
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,7168,3584,0.11042577690548366
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,7168,6144,0.3248702155219184
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,7168,3072,0.0916995538605584
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,7168,5120,0.2802293300628662
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,7168,2560,0.082205335299174
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,7168,4096,0.2363635434044732
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,7168,3584,0.18674222628275552
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,7168,2048,0.06037244531843397
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,7168,3072,0.16003999445173475
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,7168,1536,0.04610310991605123
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,7168,2560,0.13809866375393337
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,7168,1024,0.032680001523759626
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,7168,768,0.026416889495319788
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,7168,2048,0.12253599696689182
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,7168,512,0.020783111453056335
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,7168,1536,0.08918044302198623
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,7168,256,0.01587733295228746
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,7168,128,0.013462222284740873
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,7168,512,0.043896890348858304
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,7168,256,0.035176889763938055
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,7168,64,0.012608889076444836
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,7168,128,0.031545778115590416
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,7168,32,0.013194666968451606
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,7168,32,0.03075466553370158
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,7168,51200,3.1226471794976125
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,7168,65536,3.9975323147243924
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,7168,1024,0.06804711288876004
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,7168,768,0.05380710959434509
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,6144,12288,0.3177831172943115
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,6144,16384,0.38891643948025173
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,7168,64,0.031159109539455835
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,6144,51200,1.3392186694675023
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,6144,10240,0.2378693421681722
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,6144,16384,0.7898284594217936
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,6144,65536,1.822757297092014
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,6144,12288,0.6111084620157877
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,6144,7168,0.18790755007002088
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,6144,8192,0.40841955608791775
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,6144,6144,0.1518711116578844
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,6144,7168,0.36408178011576336
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,6144,5120,0.1244586706161499
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,6144,6144,0.29610223240322536
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,6144,4096,0.10104711188210382
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,6144,3584,0.09780177805158828
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,6144,5120,0.24636620945400664
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,6144,4096,0.19208178255293104
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,6144,3072,0.0790826678276062
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,6144,3584,0.1695822212431166
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,6144,2048,0.05172444383303324
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,6144,2560,0.12760710716247559
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,6144,1536,0.03926755653487311
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,6144,8192,0.19999378257327607
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,6144,2048,0.10416622294320001
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,6144,1024,0.027313777142100867
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,6144,768,0.022533333963818018
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,6144,1536,0.08300977945327759
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,6144,1024,0.06096888913048638
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,6144,512,0.017645332548353408
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,6144,256,0.013794666363133324
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,6144,768,0.04979644550217522
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,6144,128,0.011722666521867117
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,6144,512,0.03888622257444594
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,6144,256,0.030932443009482488
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,6144,64,0.010335110955768162
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,6144,32,0.011020444333553314
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,6144,128,0.028584887584050495
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,6144,64,0.028452446063359577
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,6144,51200,2.888011508517795
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,6144,32,0.0281315545241038
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,6144,2560,0.06741244263119169
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,6144,3072,0.1443208853403727
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,5120,16384,0.27960533565945095
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,6144,10240,0.48977332644992405
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,5120,12288,0.21836088763342965
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,5120,10240,0.19212267133924696
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,5120,16384,0.7198017968071831
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,5120,51200,1.1229226854112413
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,6144,65536,3.6839574178059897
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,5120,8192,0.16423200236426458
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,5120,12288,0.5355306731330024
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,5120,7168,0.14375555515289307
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,5120,6144,0.12416177325778538
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,5120,10240,0.46036979887220597
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,5120,8192,0.4464569091796875
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,5120,5120,0.10343911250432332
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,5120,7168,0.3321404457092285
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,5120,4096,0.10439199871487087
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,5120,3584,0.07849244276682536
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,5120,6144,0.272145774629381
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,5120,3072,0.06325599882337782
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,5120,5120,0.22574400901794434
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,5120,4096,0.17452000247107613
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,5120,2560,0.05754399961895413
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,5120,2048,0.04365244507789612
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,5120,3584,0.15529421965281168
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,5120,1536,0.03415377934773763
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,5120,3072,0.1324382225672404
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,5120,1024,0.023989333046807185
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,5120,2560,0.11311111185285781
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,5120,768,0.019966221517986722
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,5120,2048,0.09530044264263576
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,5120,512,0.014727110664049784
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,5120,1536,0.07682489024268256
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,5120,256,0.0114702218108707
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,5120,1024,0.05405066741837395
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,5120,768,0.04522666666242811
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,5120,128,0.01070844464831882
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,5120,512,0.034994665119383074
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,5120,64,0.00963288876745436
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,5120,256,0.028519110547171697
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,5120,65536,1.4273618062337239
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,5120,51200,2.537817849053277
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,5120,128,0.02596355477968852
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,5120,64,0.025714667307005987
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,5120,32,0.02535022298494975
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,4096,16384,0.2805946667989095
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,5120,65536,3.339817682902018
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,4096,51200,0.7234426604376899
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,4096,12288,0.20719644758436415
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,4096,65536,1.0350542068481445
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,4096,16384,0.6660657988654243
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,5120,32,0.009682666924264696
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,4096,8192,0.1457137796613905
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,4096,12288,0.528914663526747
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,4096,7168,0.1227946678797404
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,4096,10240,0.503984875149197
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,4096,8192,0.32848887973361546
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,4096,6144,0.109424889087677
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,4096,5120,0.08941866954167683
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,4096,7168,0.2937893337673611
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,4096,4096,0.07327289051479764
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,4096,6144,0.25909866227044
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,4096,3584,0.063028441535102
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,4096,5120,0.216592894660102
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,4096,3072,0.05154933200942146
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,4096,4096,0.1588817834854126
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,4096,2560,0.04727288749482897
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,4096,2048,0.03859822286499871
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,4096,3584,0.13955999745262995
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,4096,3072,0.12388532691531712
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,4096,1536,0.0277839998404185
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,4096,1024,0.020900444851981267
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,4096,51200,2.230883492363824
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,4096,2560,0.1022791133986579
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,4096,768,0.017596445149845548
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,4096,512,0.013919111755159167
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,4096,10240,0.20506489276885986
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,4096,256,0.010103111465771994
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,4096,1536,0.06807821989059448
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,4096,1024,0.04885422190030416
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,4096,128,0.00868977771864997
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,4096,64,0.007664889097213745
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,4096,768,0.04095822241571214
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,4096,512,0.03160266743765937
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,4096,32,0.007598222129874759
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,4096,256,0.02513422237502204
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,4096,128,0.023401778605249193
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,4096,64,0.023318222827381555
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,4096,32,0.022632888621754114
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,4096,65536,2.8908292982313366
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,3584,16384,0.226311100853814
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,3584,12288,0.17765243848164877
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,3584,10240,0.17759644985198975
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,3584,51200,0.7319724294874402
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,3584,65536,0.8224248886108398
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,3584,16384,0.6175653139750162
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,3584,12288,0.47536802291870117
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,3584,7168,0.11496978335910374
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,3584,8192,0.1660755607816908
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,3584,6144,0.09647288587358262
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,3584,5120,0.08101689153247409
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,3584,10240,0.41164978345235187
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,3584,7168,0.278860436545478
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,3584,6144,0.2946515613132053
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,3584,4096,0.06311644448174371
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,3584,3584,0.07077866792678833
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,3584,5120,0.19408533308241102
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,3584,4096,0.1511333386103312
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,3584,3072,0.062296887238820396
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,3584,2560,0.04191022117932638
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,3584,2048,0.034713778230879046
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,3584,3072,0.11425599786970352
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,3584,2560,0.12733066082000732
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,3584,1536,0.02680977847841051
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,3584,1024,0.017881777551439073
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,3584,2048,0.07966133621003893
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,3584,768,0.014083556003040738
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,3584,1536,0.06487733125686646
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,3584,51200,2.075259526570638
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,3584,1024,0.04597244328922696
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,3584,512,0.011714666253990598
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,3584,256,0.009012444151772393
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,3584,768,0.0391813317934672
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,3584,128,0.007941332956155142
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,3584,64,0.007260444263617198
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,3584,512,0.029853334029515583
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,3584,256,0.024068444967269897
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,3584,128,0.021993777818149988
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,3584,32,0.007291555404663086
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,3584,64,0.02160177793767717
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,3584,8192,0.3625626564025879
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,3584,32,0.021426666114065383
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,3584,65536,2.6511751810709634
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,3072,16384,0.22398667865329316
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,3584,3584,0.13490045070648193
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,3072,12288,0.1693342261844211
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,3072,51200,0.6481048795912001
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,3072,16384,0.5779226620992025
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,3072,65536,0.8391608662075467
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,3072,10240,0.13679467307196722
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,3072,8192,0.11502844757503933
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,4096,2048,0.0837857789463467
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,3072,7168,0.10220977995130752
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,3072,12288,0.43529865476820206
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,3072,6144,0.08931733502282037
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,3072,10240,0.3669404453701443
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,3072,8192,0.3369973235660129
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,3072,5120,0.0754400028122796
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,3072,7168,0.26041332880655926
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,3072,4096,0.05695288711123996
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,3072,3584,0.04439999990993076
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,3072,6144,0.22239287694295248
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,3072,3072,0.037668443388409086
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,3072,5120,0.18304710918002656
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,3072,2560,0.03197866678237915
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,3072,4096,0.16742932796478271
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,3072,2048,0.02652799917591943
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,3072,3584,0.13525511158837214
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,3072,1536,0.021924444370799597
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,3072,1024,0.01590844492117564
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,3072,2560,0.09218755695554946
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,3072,768,0.012993777791659037
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,3072,2048,0.07937688959969415
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,3072,1536,0.0579893324110243
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,3072,512,0.010383110907342698
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,3072,1024,0.0431253347131941
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,3072,256,0.008241777618726095
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,3072,51200,1.9131724039713542
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,3072,128,0.007269333634111617
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,3072,768,0.03583644496070014
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,3072,64,0.006566222343179915
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,3072,512,0.028296000427669946
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,3072,32,0.0069288888739215
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,3072,256,0.02240088913175795
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,3072,128,0.020599111914634705
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,3072,64,0.019896888070636325
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,3072,32,0.020239111449983384
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,3072,65536,2.415175120035807
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,2560,16384,0.1587537791993883
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,2560,12288,0.12023999955919053
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,2560,51200,0.428546667098999
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,2560,65536,0.6272720230950249
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,2560,10240,0.1132613288031684
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,2560,8192,0.07680266433291964
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,3072,3072,0.10875911182827419
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,2560,16384,0.5444284545050727
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,2560,7168,0.07183288865619235
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,2560,12288,0.41379110018412274
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,2560,6144,0.06160622172885471
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,2560,5120,0.05202755663130018
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,2560,10240,0.38597599665323895
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,2560,4096,0.04375822345415751
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,2560,8192,0.2838462193806966
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,2560,7168,0.245598210228814
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,2560,3584,0.038451555702421404
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,2560,6144,0.21033777130974662
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,2560,3072,0.033844444486829973
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,2560,5120,0.1738871071073744
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,2560,2560,0.03147466646300422
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,2560,4096,0.1438195572959052
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,2560,2048,0.025608888930744592
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,2560,1536,0.02199733257293701
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,2560,3584,0.12020444869995117
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,2560,2560,0.08705244461695354
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,2560,1024,0.01677955521477593
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,2560,2048,0.07071733474731445
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,2560,768,0.01274222218328052
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,2560,1536,0.05440622236993578
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,2560,512,0.010496888723638324
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,2560,256,0.008294222255547842
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,2560,1024,0.0406675570540958
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,2560,768,0.03565244542227851
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,2560,128,0.006568888823191325
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,2560,64,0.006252444452709622
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,2560,512,0.026714666022194758
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,2560,256,0.021135111649831135
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,2560,51200,1.7509849336412218
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,2560,128,0.019211555520693462
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,2560,64,0.018650665879249573
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,2560,32,0.01890222231547038
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,2048,16384,0.13163110944959852
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,2560,65536,2.2516863081190324
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,2048,51200,0.37955466906229657
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,2048,65536,0.4795697530110677
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,2048,12288,0.1027208897802565
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,2048,10240,0.0915493302875095
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,2048,8192,0.07236622439490424
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,2560,3072,0.10252622101042007
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,2048,16384,0.5142835511101617
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,2048,12288,0.424366209242079
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,2048,10240,0.32741332054138184
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,2048,6144,0.05458133419354757
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,2048,8192,0.2862702210744222
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,2048,5120,0.04458489020665487
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,2048,7168,0.23225511444939506
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,2048,4096,0.03522933191723294
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,2048,6144,0.19877955648634169
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,2048,3584,0.03194222185346816
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,2048,5120,0.17042756080627441
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,2048,3072,0.028061333629820082
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,2048,4096,0.1271173291736179
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,2048,2560,0.024080889092551336
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,2048,3584,0.11124089029100205
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,2048,51200,1.6211741765340169
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,2048,3072,0.09677066405614217
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,2048,1536,0.01568177839120229
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,2048,2560,0.08156444629033406
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,2048,1024,0.011873777541849347
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,2048,2048,0.06770310799280803
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,2048,1536,0.05341955688264635
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,2048,768,0.01000355515215132
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,2048,512,0.00794044468137953
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,2048,65536,2.0740648905436196
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,2048,1024,0.03704977697796292
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,2048,768,0.03199288911289639
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,2048,256,0.006584888945023219
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,2048,7168,0.0625680022769504
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,2048,128,0.005633777628342311
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,2048,64,0.005210666606823604
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,2048,32,0.00554577757914861
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,2048,256,0.019868445065286424
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,2048,128,0.017852443787786696
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,2048,64,0.01722400055991279
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,2560,32,0.0069102222720781965
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,2048,32,0.017180444465743173
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,1536,16384,0.10927377806769477
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,1536,65536,0.43685065375434023
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,1536,51200,0.32940533426072865
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,1536,12288,0.08182755443784925
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,2048,2048,0.01982133256064521
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,1536,10240,0.07376622491412692
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,1536,8192,0.06317866510815091
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,1536,16384,0.48469866646660703
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,1536,12288,0.37229511472913956
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,1536,7168,0.05350311266051399
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,1536,10240,0.30743998951382107
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,1536,6144,0.0417902237839169
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,1536,5120,0.03797422183884515
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,2048,512,0.024904888537194993
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,1536,8192,0.2777528762817383
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,1536,4096,0.029666665527555678
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,1536,6144,0.1868293285369873
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,1536,3584,0.02624711063173082
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,1536,5120,0.15376710891723633
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,1536,3072,0.023004444109068975
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,1536,2560,0.020337777005301583
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,1536,3584,0.1040159993701511
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,1536,3072,0.09046577745013767
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,1536,2048,0.017318222257826064
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,1536,51200,1.497285313076443
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,1536,2560,0.0766213337580363
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,1536,1536,0.014096000128322177
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,1536,1024,0.01015822258260515
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,1536,768,0.00868266655339135
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,1536,2048,0.0634488860766093
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,1536,1536,0.04890844557020399
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,1536,1024,0.03463200065824721
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,1536,256,0.005960888746711943
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,1536,65536,1.9141271379258897
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,1536,128,0.005224888937340842
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,1536,512,0.023356444305843774
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,1536,64,0.004574222283230888
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,1536,256,0.018572444717089336
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,1536,32,0.004878222114510006
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,1536,128,0.01668355531162686
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,1536,64,0.016131555040677387
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,1536,32,0.015858666764365304
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,1024,65536,0.2899911138746473
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,1536,7168,0.219032883644104
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,1024,51200,0.2305555608537462
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,1024,16384,0.07431911097632514
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,1024,12288,0.05799466371536255
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,1536,4096,0.12632089191012913
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,1024,10240,0.05145244465933906
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,1024,8192,0.0403093331389957
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,1024,12288,0.3541911178165012
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,1024,16384,0.4519057803683811
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,1024,7168,0.03189244535234239
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,1024,10240,0.28698934449089897
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,1024,6144,0.027277333868874445
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,1024,8192,0.24886933962504068
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,1536,512,0.006955555743641323
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,1024,5120,0.0236791107389662
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,1536,768,0.02968177861637539
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,1024,3584,0.017495110630989075
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,1024,7168,0.20368711153666177
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,1024,6144,0.17404888735877144
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,1024,5120,0.14608177873823378
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,1024,3072,0.016064888901180692
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,1024,4096,0.1144968933529324
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,1024,2560,0.013985777894655863
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,1024,2048,0.011756444142924415
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,1024,1536,0.009714666340086196
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,1024,3584,0.09650666846169366
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,1024,3072,0.08428088823954265
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,1024,2560,0.0712640020582411
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,1024,1024,0.007617777420414819
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,1024,2048,0.05740000141991509
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,1024,768,0.006623999940024481
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,1024,1536,0.04583377639452616
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,1024,512,0.0058711109062035876
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,1024,256,0.004903111192915174
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,1024,1024,0.031896889209747314
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,1024,768,0.027635556128289964
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,1024,128,0.004514666481150521
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,1024,512,0.021993777818149988
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,1024,64,0.0038951109680864546
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,1024,256,0.017267554998397827
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,1024,65536,1.7730844285753038
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,1024,128,0.015120888749758402
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,1024,64,0.015111999379263984
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,1024,32,0.014831999937693277
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,768,65536,0.21856533156500924
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,768,51200,0.2031031052271525
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,768,16384,0.06468711296717326
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,1024,4096,0.01956977778010898
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,768,12288,0.04820355441835192
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,768,10240,0.04001511136690775
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,768,16384,0.43949066268073184
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,768,12288,0.3330559995439318
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,768,8192,0.030454221698972914
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,1024,51200,1.393900447421604
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,768,7168,0.027552000350422327
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,768,6144,0.024140444066789415
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,768,8192,0.22582401169670951
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,1024,32,0.00388355553150177
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,768,7168,0.1981519990497165
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,768,4096,0.018187556001875136
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,768,5120,0.13901510503556994
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,768,51200,1.3474675284491644
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,768,3584,0.016294222739007738
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,768,3072,0.014300444059901767
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,768,65536,1.7226773367987738
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,768,3072,0.08160444762971666
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,768,2560,0.012911111116409302
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,768,2048,0.010675555302037133
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,768,2560,0.06912977827919854
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,768,1536,0.009295110901196798
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,768,10240,0.2817591031392415
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,768,2048,0.05574666791492038
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,768,1024,0.007364444434642792
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,768,768,0.006530666516886816
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,768,512,0.005561777700980504
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,768,1536,0.04301155606905619
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,768,768,0.026737777723206416
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,768,1024,0.031173331869973078
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,768,256,0.004874666531880696
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,768,128,0.004197333421972063
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,768,512,0.021390222840838965
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,768,64,0.0038453332251972626
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,768,5120,0.021529777182473078
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,768,32,0.0038515557017591265
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,768,6144,0.16963022285037568
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,768,128,0.014452444182501899
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,768,64,0.014105778601434497
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,768,32,0.013758222262064615
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,512,65536,0.17266578144497344
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,512,51200,0.14493244224124485
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,512,16384,0.04673599865701464
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,768,4096,0.10827910900115967
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,512,12288,0.03475288881195916
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,512,10240,0.02759733299414317
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,512,8192,0.021710221966107685
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,768,3584,0.09407111008961995
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,512,7168,0.01919555498494042
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,512,12288,0.31824978192647296
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,512,10240,0.26783643828497994
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,512,16384,0.41985156801011825
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,512,6144,0.01703733371363746
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,512,5120,0.015124445160230001
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,512,8192,0.21590399742126465
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,512,4096,0.012784889174832238
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,512,3584,0.011361777782440186
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,512,7168,0.18962577978769937
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,512,3072,0.010709332923094431
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,512,6144,0.1626853280597263
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,512,5120,0.13338489002651638
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,512,4096,0.10312622123294407
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,512,2560,0.00903555585278405
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,512,2048,0.008303999900817871
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,512,3584,0.08921155664655898
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,512,1536,0.00638488887084855
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,512,1024,0.005576888720194499
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,512,3072,0.07768622371885511
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,512,2560,0.06522578001022339
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,512,2048,0.052433778842290245
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,768,256,0.016206221448050607
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,512,1536,0.04000622365209792
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,512,512,0.004238222208287981
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,512,256,0.003847111016511917
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,512,1024,0.02960088849067688
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,512,128,0.0035573335157500375
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,512,768,0.02548800077703264
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,512,51200,1.287125375535753
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,512,64,0.0034977777136696708
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,512,32,0.003519111209445529
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,512,512,0.020243555307388306
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,512,256,0.015471110741297403
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,512,128,0.013781333135233985
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,512,64,0.013401777380042605
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,256,65536,0.10319466723336114
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,512,32,0.013108444710572561
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,256,51200,0.08323022392061022
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,512,65536,1.6443662643432617
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,256,16384,0.03291822142071194
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,256,12288,0.021867555048730638
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,256,10240,0.017258667283587985
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,256,8192,0.014532445205582513
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,256,12288,0.30984534157647026
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,256,10240,0.2602693239847819
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,256,16384,0.40924800766838926
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,256,8192,0.21017955409155953
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,256,7168,0.013233777549531726
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,256,6144,0.011521778172916837
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,256,5120,0.01034755590889189
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,256,4096,0.008962666822804345
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,256,7168,0.18472088707817924
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,256,6144,0.15818577342563206
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,512,768,0.004905777672926585
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,256,5120,0.12957421938578287
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,256,4096,0.10047377480400933
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,256,3072,0.0076453329788313965
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,256,2560,0.006913777854707506
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,256,2048,0.0059075554211934405
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,256,3584,0.08662133084403144
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,256,3072,0.07516888777414958
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,256,1536,0.005232000102599462
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,256,2560,0.06336000230577257
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,256,1024,0.004502222355869082
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,256,2048,0.05095200075043572
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,256,768,0.004325333154863781
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,256,51200,1.2505253685845268
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,256,512,0.0038773334688610504
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,256,1536,0.039649777942233615
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,256,256,0.003504000190231535
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,256,128,0.003154666680428717
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,256,1024,0.028677334388097126
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,256,768,0.02502044373088413
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,256,64,0.0028657778683635923
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,256,512,0.01979377700222863
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,256,32,0.003185777821474605
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,256,256,0.015035554766654968
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,256,128,0.013081777426931592
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,128,65536,0.07632444302241008
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,256,64,0.013017777767446307
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,256,32,0.012392000191741519
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,128,51200,0.06206755505667793
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,128,16384,0.026006221771240234
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,128,12288,0.016580444243219163
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,128,10240,0.014807111687130399
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,128,12288,0.3021706740061442
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,256,3584,0.00832088871134652
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,128,16384,0.3988622294531928
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,128,8192,0.013160000244776407
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,128,10240,0.25380444526672363
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,128,7168,0.011876444849703046
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,128,6144,0.010623111493057676
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,128,5120,0.009531555904282464
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,128,4096,0.00796088907453749
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,128,8192,0.20480799674987793
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,128,7168,0.17995199892255995
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,128,6144,0.1540000041325887
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,128,5120,0.1258266634411282
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,128,3072,0.006617777877383762
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,128,2560,0.006269333263238271
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,128,4096,0.09722310966915554
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,128,3584,0.08472088972727458
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,256,65536,1.5993661880493164
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,128,3072,0.07273955477608575
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,128,1536,0.004932444542646408
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,128,2560,0.06155822012159559
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,128,51200,1.2181857426961262
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,128,1024,0.00423555572827657
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,128,2048,0.048727999130884804
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,128,768,0.003930666794379552
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,128,1536,0.03666933377583822
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,128,256,0.0032808888289663526
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,128,1024,0.027767111857732136
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,128,768,0.024106666445732117
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,128,65536,1.5575182172987196
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,128,128,0.00315022220214208
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,128,512,0.01923022170861562
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,128,64,0.0028408887899584244
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,128,32,0.003173333282272021
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,128,256,0.014194667339324951
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,128,64,0.012098666694429187
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,128,32,0.012100444071822695
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,64,51200,0.05942489041222466
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,64,16384,0.02308799988693661
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,128,3584,0.007302222152551015
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,64,12288,0.01482222146458096
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,64,16384,0.39868799845377606
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,128,2048,0.005574222240183089
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,64,10240,0.012710221939616732
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,64,12288,0.3016435570187039
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,128,512,0.003539555602603488
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,64,8192,0.01107911103301578
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,64,10240,0.2533173296186659
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,64,7168,0.01036533299419615
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,64,6144,0.010677333507272931
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,64,65536,0.07093244128757052
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,64,5120,0.009684444301658207
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,64,51200,1.2171440124511719
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,64,7168,0.17971466647254097
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,64,4096,0.007834666305118138
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,64,6144,0.1539333396487766
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,64,3584,0.007253333098358578
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,64,3072,0.006614222294754452
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,64,65536,1.5587644577026367
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,64,2560,0.006228444476922353
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,64,4096,0.09707822402318318
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,64,2048,0.005294222384691238
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,64,3584,0.08422666788101196
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,64,3072,0.07283555799060397
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,64,1536,0.005040888984998067
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,64,1024,0.0041653331783082755
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,64,2560,0.0613466633690728
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,64,768,0.003882666842805015
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,64,1536,0.03667111198107401
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,64,512,0.0033315554675128725
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,64,768,0.0240631103515625
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,64,256,0.0031537777847713898
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,64,512,0.0192248887485928
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,64,128,0.0028159999185138275
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,64,256,0.014138667119873894
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,64,64,0.002858666703104973
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,64,128,0.012440000143316058
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,64,32,0.0032222221295038858
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,64,8192,0.20475110742780897
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,64,64,0.012038222617573209
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,32,65536,0.07380000087949964
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,64,32,0.012083555261294046
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,32,51200,0.05818133221732246
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,32,16384,0.022335110439194575
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,64,5120,0.12656711207495794
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,32,12288,0.01309333327743742
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,64,2048,0.04845866560935974
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,32,10240,0.011706666813956367
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,64,1024,0.027533332506815594
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,32,16384,0.39889687962002224
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,32,8192,0.013811555173661975
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,32,12288,0.30184443791707355
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,32,7168,0.00942844483587477
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,32,6144,0.009018667042255402
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,32,10240,0.25357866287231445
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,32,8192,0.204675555229187
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,32,5120,0.008607111043400234
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,32,7168,0.17965688970353869
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,32,4096,0.009707555174827576
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,32,3584,0.008662222160233391
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,32,6144,0.15366310543484157
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,128,128,0.012673777838548025
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,32,2560,0.007258666886223688
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,32,4096,0.0975102252430386
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,32,5120,0.1259511046939426
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,32,3584,0.08474044667349921
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,32,2048,0.005250666704442766
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,32,3072,0.07274044222301908
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,32,1536,0.004885333279768626
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,32,1024,0.0038515557017591265
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,32,2560,0.06181510951783922
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,32,768,0.003556444413132138
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,32,512,0.003504000190231535
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,32,2048,0.048269334766599864
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,32,1536,0.03684622380468581
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,32,256,0.003212444484233856
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,32,1024,0.027934223413467407
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,32,65536,1.559041765001085
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,32,128,0.0028888889484935333
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,32,768,0.024188444018363953
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,32,64,0.002551111082235972
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,32,512,0.01923644377125634
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,32,32,0.0028408887899584244
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,32,256,0.014303111367755465
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,32,128,0.0123848890264829
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,32,64,0.012348444097571902
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,32,32,0.011711999773979187
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3329,32,3072,0.007982222570313348
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3329,32,51200,1.2170328564114041
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,65536,12288,3.1421065860324435
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,65536,16384,4.238872951931424
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,65536,12288,3.558585696750217
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,65536,16384,4.962089962429471
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,65536,16384,4.541673024495442
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,65536,10240,2.821427451239692
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,65536,10240,2.919823964436849
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,65536,12288,3.329256057739258
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,65536,8192,2.4336995018853083
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,65536,10240,2.7870559692382812
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,65536,8192,2.3122177124023438
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,65536,7168,2.0090870327419705
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,65536,8192,2.2765644921196833
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,65536,7168,1.9510186513264973
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,65536,6144,1.622072007921007
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,65536,7168,1.973782221476237
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,65536,5120,1.2706836064656575
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,65536,6144,1.6698826683892145
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,65536,51200,12.703529357910156
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,65536,6144,1.7038657930162218
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,65536,5120,1.3932391272650824
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,65536,4096,1.0782835218641493
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,65536,4096,1.114874627855089
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,65536,3584,0.9103511174519857
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,65536,5120,1.394600020514594
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,65536,3584,0.9531182183159722
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,65536,4096,1.1430186165703666
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,65536,3072,0.7786373562282987
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,65536,3584,0.919256846110026
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,65536,3072,0.9416187074449328
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,65536,2560,0.7546248965793185
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,65536,2048,0.5048577520582411
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,65536,3072,0.8518986701965332
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,65536,2048,0.5794977611965603
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,65536,2560,0.688211547003852
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,65536,1536,0.43161866399976945
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,65536,1536,0.4827902052137587
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,65536,2560,0.6355928844875759
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,65536,1024,0.2786622312333849
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,65536,2048,0.5761937565273708
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,65536,1536,0.4424977832370334
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,65536,1024,0.44242133034600156
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,65536,512,0.15572978390587702
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,65536,768,0.2871608999040392
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,65536,512,0.26460443602667916
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,65536,256,0.12331999672783746
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,65536,512,0.2553848955366346
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,65536,128,0.09694488843282063
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,65536,256,0.20628000630272758
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,65536,256,0.1755982240041097
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,65536,64,0.07610578007168241
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,65536,128,0.13504532972971597
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,65536,128,0.1973715490765042
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,65536,32,0.08525866932339138
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,65536,64,0.19863288932376436
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,65536,768,0.21170400248633492
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,65536,32,0.1999244425031874
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,65536,1024,0.3357146581013997
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,65536,768,0.31477512253655326
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,65536,51200,15.011591593424479
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,65536,51200,21.153227064344616
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,51200,16384,3.470841725667318
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,51200,16384,3.9527325100368924
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,51200,12288,2.4518985748291016
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,51200,51200,10.016981336805555
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,51200,16384,3.6183077494303384
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,51200,65536,12.825959947374132
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,51200,12288,2.8190729353162975
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,51200,10240,2.1381403605143228
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,51200,12288,2.671237309773763
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,51200,10240,2.380326165093316
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,51200,8192,1.8291572994656031
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,51200,10240,2.274203618367513
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,51200,51200,15.9632568359375
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,51200,8192,1.895367940266927
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,51200,7168,1.543532477484809
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,51200,7168,1.6058088938395183
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,51200,6144,1.3260559505886502
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,51200,8192,1.752165370517307
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,51200,51200,12.352377997504341
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,51200,7168,1.5664328469170465
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,51200,5120,1.0314737955729167
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,51200,6144,1.365832010904948
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,51200,4096,0.755290667215983
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,51200,5120,1.1374186409844291
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,51200,6144,1.3673067092895508
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,51200,3584,0.6853982077704536
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,51200,5120,1.051020410325792
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,51200,4096,0.9422328737046984
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,51200,3584,0.7700835333930122
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,51200,4096,0.8739911185370551
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,51200,3072,0.5917538007100424
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,51200,65536,20.58253648546007
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,51200,2560,0.4983821974860297
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,51200,3584,0.765175978342692
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,51200,2560,0.6025324397616917
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,51200,3072,0.663864877488878
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,51200,2048,0.4574613571166992
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,51200,1536,0.2769013245900472
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,51200,65536,15.760092841254341
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,51200,2048,0.544141345553928
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,51200,1536,0.3791768815782335
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,51200,2560,0.5648053487141927
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,51200,1024,0.21183644400702584
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,51200,2048,0.4772373305426703
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,51200,768,0.17085956202612984
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,51200,512,0.13668621910942927
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,51200,1536,0.48423290252685547
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,51200,1024,0.2807519965701633
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,51200,768,0.27456622653537327
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,51200,256,0.09497955772611831
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,51200,3072,0.6878222359551324
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,51200,512,0.1845839950773451
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,51200,1024,0.3686666753556993
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,51200,512,0.19295644760131836
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,51200,128,0.07566577858395047
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,51200,768,0.22257423400878906
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,51200,256,0.16415377457936606
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,51200,64,0.06132355663511488
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,51200,256,0.15621333652072483
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,51200,128,0.11035111215379502
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,51200,32,0.06192533175150553
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,51200,128,0.15349777539571127
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,51200,64,0.15888355837927923
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,51200,32,0.1576497819688585
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,16384,16384,1.0533101823594835
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,16384,16384,1.5033928553263347
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,16384,51200,3.208822250366211
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,16384,12288,0.7899280124240451
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,16384,65536,4.099177890353732
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,16384,12288,1.0967013041178386
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,16384,16384,1.528251541985406
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,16384,10240,0.7620088789198133
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,16384,12288,1.1035679711235893
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,16384,10240,0.8962666193644205
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,16384,8192,0.6329030990600586
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,16384,10240,0.9106302261352539
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,16384,51200,6.204520755343967
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,16384,7168,0.5646124415927464
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,16384,8192,0.7247324519687228
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,16384,51200,4.8664194742838545
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,16384,8192,0.7283493147956001
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,16384,7168,0.6287093162536621
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,16384,6144,0.43736712137858075
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,16384,6144,0.5283208953009711
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,16384,5120,0.2972124417622884
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,16384,4096,0.2605457835727268
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,16384,7168,0.6573217709859213
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,16384,5120,0.4410906632741292
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,16384,4096,0.3538542323642307
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,16384,6144,0.5779653125339085
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,16384,3584,0.23625066545274523
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,16384,65536,7.5714060465494795
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,16384,3584,0.30163200696309406
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,16384,3072,0.20069421662224662
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,16384,4096,0.37854401270548504
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,16384,2560,0.16353332996368408
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,16384,3584,0.33150490125020343
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,16384,3072,0.26759288046095103
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,16384,2560,0.23138401243421766
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,16384,2048,0.13241510921054417
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,16384,3072,0.30336178673638237
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,16384,65536,6.287047915988499
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,16384,2560,0.2508311006757948
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,16384,1536,0.10991377962960137
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,16384,1024,0.07703022162119548
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,16384,2048,0.18471022446950278
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,16384,768,0.06030133035447863
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,16384,1536,0.1658008893330892
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,16384,1024,0.11019200086593628
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,16384,1024,0.12993155585394964
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,16384,768,0.08876444233788384
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,16384,768,0.11761955420176189
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,16384,256,0.0310808883772956
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,16384,512,0.08749155865775214
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,16384,512,0.07438577546013726
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,16384,128,0.027503111296229895
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,16384,256,0.06554222106933594
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,16384,256,0.06924800078074138
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,16384,64,0.022107554806603327
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,16384,128,0.05380710959434509
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,16384,32,0.02271555529700385
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,16384,64,0.060657779375712075
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,16384,32,0.06012711260053846
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,16384,2048,0.21426755852169463
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,16384,1536,0.14748088518778482
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,16384,512,0.04301333427429199
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,16384,5120,0.5063858032226562
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,16384,128,0.059317330519358315
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,12288,16384,0.8058311144510905
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,12288,16384,1.1998702155219185
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,12288,51200,2.527198155721029
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,12288,65536,3.1557786729600696
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,12288,12288,0.5967395570543077
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,12288,10240,0.5379733509487575
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,12288,16384,1.2501618067423503
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,12288,12288,0.9108240339491102
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,12288,12288,0.919473754035102
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,12288,8192,0.4112951225704617
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,12288,10240,0.8298186726040311
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,12288,10240,0.7746879789564344
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,12288,7168,0.36210044225056964
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,12288,8192,0.5811973147922093
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,12288,7168,0.5073297818501791
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,12288,51200,4.772783915201823
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,12288,6144,0.26902932590908474
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,12288,8192,0.6411662101745605
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,12288,5120,0.22631822692023384
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,12288,51200,3.9796986050075955
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,12288,7168,0.5728675524393717
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,12288,6144,0.4330551094479031
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,12288,5120,0.3640720049540202
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,12288,6144,0.4949733416239421
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,12288,65536,6.253534105088975
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,12288,4096,0.2851395606994629
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,12288,3584,0.16466311613718668
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,12288,4096,0.3161999914381239
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,12288,5120,0.42730045318603516
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,12288,3072,0.13319999641842312
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,12288,3584,0.2553173436058892
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,12288,65536,5.174226548936632
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,12288,2560,0.11318933963775635
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,12288,3584,0.309663110309177
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,12288,2048,0.09179111321767171
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,12288,3072,0.24933687845865884
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,12288,2560,0.18610933091905382
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,12288,1536,0.07788622379302979
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,12288,2560,0.22654400931464302
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,12288,2048,0.1782346698972914
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,12288,2048,0.15443110466003418
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,12288,1024,0.056736886501312256
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,12288,1536,0.12043733066982693
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,12288,768,0.04306844539112515
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,12288,1024,0.09250399801466201
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,12288,1024,0.10976711246702407
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,12288,4096,0.21176444159613717
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,12288,512,0.03313066562016805
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,12288,768,0.07379555702209473
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,12288,256,0.025055110454559326
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,12288,512,0.061398221386803516
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,12288,128,0.022310222188631695
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,12288,256,0.051629334688186646
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,12288,512,0.0731368859608968
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,12288,64,0.01905333333545261
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,12288,128,0.04717955655521817
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,12288,32,0.01982222166326311
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,12288,64,0.048078222407235034
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,12288,3072,0.21583733293745253
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,12288,32,0.048800001541773476
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,12288,1536,0.14102221859825984
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,12288,768,0.09193955527411567
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,12288,256,0.05663466453552246
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,12288,128,0.047896001074049205
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,10240,16384,0.7156391143798828
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,10240,16384,1.059310171339247
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,10240,51200,2.0520551469590926
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,10240,65536,2.680823008219401
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,10240,12288,0.5043902397155762
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,10240,12288,0.7913395563761393
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,10240,16384,1.1523751152886283
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,10240,12288,0.8627680142720541
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,10240,10240,0.6494613223605686
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,10240,8192,0.365955564710829
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,10240,10240,0.7177982330322266
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,10240,10240,0.47213157018025714
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,10240,51200,4.059174431694879
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,10240,7168,0.3157546785142687
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,10240,8192,0.5160417556762695
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,10240,8192,0.6016257603963217
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,10240,6144,0.26797954241434735
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,10240,65536,5.096475389268663
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,10240,7168,0.4509858025444879
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,10240,6144,0.3873884412977431
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,10240,5120,0.22755556636386445
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,10240,51200,3.6171696980794272
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,10240,7168,0.5256133079528809
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,10240,4096,0.1549582216474745
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,10240,5120,0.3635671138763428
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,10240,3584,0.16010488404168025
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,10240,5120,0.36457867092556423
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,10240,3072,0.12670844131045872
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,10240,3584,0.22026399771372476
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,10240,4096,0.30967556105719674
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,10240,65536,4.736829121907552
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,10240,3584,0.2682933277553982
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,10240,2560,0.10616088575787014
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,10240,3072,0.1917519966761271
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,10240,3072,0.2515724500020345
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,10240,2560,0.16666844156053331
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,10240,1536,0.06979466809166802
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,10240,2048,0.13566844993167454
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,10240,2048,0.1630071136686537
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,10240,1024,0.04669244421852959
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,10240,1536,0.10840533177057902
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,10240,1536,0.1350275543000963
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,10240,768,0.038725333081351385
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,10240,1024,0.10015910863876343
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,10240,1024,0.08124177985721164
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,10240,512,0.028245333168241713
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,10240,768,0.0838586688041687
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,10240,256,0.027095110880004034
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,10240,512,0.05412888858053419
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,10240,512,0.06781955560048421
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,10240,6144,0.442521784040663
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,10240,128,0.018650665879249573
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,10240,4096,0.3159688843621148
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,10240,256,0.04522844486766391
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,10240,64,0.01566488875283135
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,10240,128,0.04276266694068909
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,10240,128,0.04104177819357978
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,10240,32,0.015812445018026564
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,10240,64,0.039897776312298246
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,10240,32,0.03964799973699782
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,10240,2048,0.09058488739861383
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,10240,2560,0.20469421810574004
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,10240,768,0.06724355618158977
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,10240,256,0.052300443251927696
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,8192,51200,1.6192880206637914
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,8192,16384,0.5274053149753147
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,8192,65536,2.027449713812934
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,8192,12288,0.4164942105611165
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,8192,16384,0.9303137461344401
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,8192,16384,1.0307778252495658
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,8192,12288,0.7274337874518501
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,8192,10240,0.35941065682305234
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,8192,51200,3.3518782721625437
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,8192,10240,0.5645110872056749
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,8192,8192,0.2883342107137044
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,8192,12288,0.7703964445326063
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,8192,7168,0.2655288908216688
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,8192,10240,0.6515448888142904
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,8192,8192,0.46067290835910374
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,8192,7168,0.3970035447014703
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,8192,65536,4.403081681993273
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,8192,6144,0.21454221672481963
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,8192,8192,0.5224826600816515
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,8192,5120,0.1789697806040446
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,8192,6144,0.34050578541225857
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,8192,4096,0.1403919988208347
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,8192,7168,0.5270871056450738
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,8192,51200,3.260835647583008
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,8192,6144,0.39902400970458984
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,8192,5120,0.3306959999932183
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,8192,4096,0.21961777740054658
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,8192,3584,0.11864977412753636
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,8192,3072,0.10289155774646336
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,8192,65536,4.133602566189237
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,8192,3584,0.19845688343048096
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,8192,2560,0.08283999893400404
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,8192,4096,0.29528355598449707
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,8192,3584,0.23572889963785806
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,8192,3072,0.16894755098554823
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,8192,3072,0.21193688445621064
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,8192,2048,0.06647555695639716
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,8192,1536,0.05027911067008972
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,8192,1024,0.03860622313287523
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,8192,2560,0.17823733223809135
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,8192,2048,0.12309688991970485
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,8192,2048,0.14708267317877874
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,8192,2560,0.1496595541636149
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,8192,1536,0.11981866094801162
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,8192,1536,0.09650222460428874
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,8192,768,0.02852355440457662
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,8192,512,0.021365332934591506
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,8192,256,0.01718222267097897
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,8192,1024,0.07098311185836792
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,8192,1024,0.09159377548429702
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,8192,768,0.07760977745056152
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,8192,768,0.05772622426350912
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,8192,512,0.06296622090869479
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,8192,512,0.045829332537121244
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,8192,64,0.012772444221708508
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,8192,256,0.03825511203871833
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,8192,256,0.04782844583193461
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,8192,32,0.012778666284349231
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,8192,128,0.03836977812978957
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,8192,128,0.03403822249836392
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,8192,64,0.03324710991647508
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,8192,5120,0.28807910283406574
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,8192,32,0.033069332440694175
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,7168,16384,0.48934491475423175
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,8192,128,0.014701333310869006
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,7168,16384,0.8861573537190756
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,7168,51200,1.7850231594509547
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,7168,65536,1.9623067643907335
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,7168,12288,0.35728179083930117
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,7168,16384,0.9576329125298394
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,7168,10240,0.29444265365600586
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,7168,12288,0.7356897989908854
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,7168,8192,0.23958312140570748
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,7168,12288,0.7335324287414551
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,7168,10240,0.5261644257439507
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,7168,51200,3.1344487931993275
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,7168,7168,0.21631199783749053
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,7168,10240,0.6838462087843152
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,7168,8192,0.4330471091800266
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,7168,6144,0.18345244725545248
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,7168,8192,0.48777156405978733
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,7168,7168,0.384044435289171
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,7168,5120,0.14811378055148655
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,7168,51200,2.972022162543403
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,7168,7168,0.43750667572021484
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,7168,4096,0.11226399739583333
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,7168,65536,4.014048682318793
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,7168,6144,0.39671733644273544
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,7168,5120,0.2669760121239556
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,7168,3584,0.1039244466357761
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,7168,4096,0.20424889193640816
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,7168,5120,0.3091626697116428
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,7168,3072,0.08563022481070624
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,7168,4096,0.2600204414791531
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,7168,2560,0.06996088557773165
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,7168,3584,0.18106667200724283
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,7168,3584,0.22297067112392852
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,7168,3072,0.1568062172995673
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,7168,3072,0.1921466721428765
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,7168,2048,0.06004710992177328
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,7168,1536,0.04435999857054817
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,7168,2560,0.13630489508310953
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,7168,65536,3.8214552137586804
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,7168,2560,0.16878133349948457
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,7168,2048,0.11094044314490424
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,7168,2048,0.13787378205193415
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,7168,1024,0.03328266739845276
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,7168,768,0.02569866677125295
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,7168,1536,0.11224977175394694
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,7168,512,0.01923377811908722
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,7168,1024,0.06664533085293241
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,7168,768,0.053471999035941235
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,7168,256,0.014731556177139282
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,7168,6144,0.3225857681698269
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,7168,512,0.059122668372260205
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,7168,128,0.012229333321253458
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,7168,256,0.044906665881474815
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,7168,256,0.033956444925732084
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,7168,64,0.011117333339320289
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,7168,128,0.031176888280444678
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,7168,32,0.011368888947698804
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,7168,128,0.036095112562179565
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,7168,64,0.030761778354644775
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,7168,32,0.030208001534144085
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,7168,1536,0.08857688638899062
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,7168,1024,0.08532000250286526
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,7168,768,0.07198133071263631
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,7168,512,0.04247644543647766
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,6144,16384,0.41588176621331113
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,6144,65536,1.73925601111518
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,6144,51200,1.4216577741834853
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,6144,12288,0.31566932466295033
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,6144,16384,0.8178168932596842
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,6144,10240,0.2708933353424072
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,6144,12288,0.7602986759609647
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,6144,16384,0.9277742173936633
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,6144,8192,0.2312097814348009
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,6144,10240,0.5111813545227051
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,6144,51200,2.8277946048312717
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,6144,65536,3.4832941691080728
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,6144,10240,0.5841626591152614
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,6144,8192,0.40622666147020126
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,6144,7168,0.18767910533481172
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,6144,8192,0.4788631333245172
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,6144,6144,0.1554364495807224
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,6144,5120,0.13791555828518337
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,6144,7168,0.3503155443403456
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,6144,51200,2.8162159389919705
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,6144,6144,0.3325706587897407
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,6144,6144,0.3575919999016656
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,6144,4096,0.1144897805319892
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,6144,5120,0.2472160127427843
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,6144,12288,0.708204428354899
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,6144,65536,3.6224454243977866
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,6144,5120,0.2986328866746691
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,6144,4096,0.19390311506059435
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,6144,3072,0.08278222216500176
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,6144,4096,0.2372586727142334
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,6144,3584,0.1660204463534885
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,6144,2560,0.06552710798051622
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,6144,3584,0.20976000361972383
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,6144,3072,0.14352711041768393
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,6144,2048,0.05534755521350437
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,6144,3072,0.18984088632795545
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,6144,1536,0.04378666811519199
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,6144,2560,0.12394044134351943
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,6144,2560,0.15806578265296087
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,6144,1024,0.030363556411531236
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,6144,2048,0.10225422514809503
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,6144,2048,0.13215466340382895
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,6144,768,0.021524444222450256
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,6144,1536,0.08238933483759563
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,6144,1536,0.1062871085272895
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,6144,512,0.01791200041770935
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,6144,1024,0.0814817746480306
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,6144,1024,0.06036711401409573
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,6144,256,0.013799111048380533
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,6144,768,0.06884444422192044
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,6144,768,0.048693332407209605
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,6144,512,0.03867111272282071
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,6144,128,0.011785777906576792
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,6144,512,0.05602400170432197
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,6144,64,0.010327999790509542
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,6144,256,0.030927111705144245
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,6144,32,0.01020088874631458
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,6144,7168,0.4127075672149658
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,6144,128,0.028200000524520874
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,6144,64,0.028016000986099243
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,6144,32,0.027631999717818365
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,6144,3584,0.09515466954973008
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,5120,51200,1.008254263136122
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,6144,256,0.0422364440229204
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,5120,65536,1.299666616651747
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,6144,128,0.03387377659479777
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,5120,16384,0.3697982099321153
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,5120,12288,0.26838933096991646
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,5120,16384,0.7139342096116809
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,5120,12288,0.6420648892720541
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,5120,16384,0.8896427154541016
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,5120,12288,0.6591911315917969
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,5120,51200,2.4915538363986545
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,5120,8192,0.17599111133151582
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,5120,10240,0.44546667734781903
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,5120,10240,0.5534977912902832
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,5120,8192,0.36031466060214573
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,5120,7168,0.17066578070322672
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,5120,51200,2.6847199334038625
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,5120,10240,0.2184035513136122
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,5120,6144,0.14147022035386828
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,5120,7168,0.313935120900472
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,5120,7168,0.3954426712459988
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,5120,6144,0.2693564361996121
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,5120,5120,0.10695822371376885
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,5120,4096,0.09004355801476373
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,5120,65536,3.4469360775417752
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,5120,6144,0.34090667300754124
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,5120,5120,0.22232355011834037
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,5120,3584,0.07868888643052843
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,5120,5120,0.2824640009138319
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,5120,4096,0.17220889197455513
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,5120,3072,0.07158666849136353
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,5120,65536,3.134873708089193
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,5120,4096,0.22667821248372397
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,5120,3584,0.15158400270673963
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,5120,2560,0.0563875569237603
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,5120,3584,0.1998071140713162
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,5120,2048,0.04502933224042257
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,5120,3072,0.1740177737341987
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,5120,2560,0.11213955614301895
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,5120,1536,0.036483556032180786
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,5120,2560,0.15011466874016657
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,5120,8192,0.44687202241685653
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,5120,2048,0.0944746666484409
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,5120,1024,0.026808000273174707
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,5120,2048,0.12533511055840388
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,5120,768,0.021252445048756067
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,5120,512,0.016064888901180692
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,5120,1536,0.07483733362621732
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,5120,1024,0.0776346657011244
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,5120,1024,0.05491911040412056
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,5120,768,0.06575733423233032
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,5120,768,0.0443484452035692
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,5120,256,0.011707555916574268
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,5120,128,0.01039644413524204
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,5120,512,0.052008890443378024
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,5120,512,0.03495733274353875
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,5120,64,0.008969777988062965
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,5120,256,0.040864000717798867
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,5120,32,0.009323555562231276
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,5120,128,0.025474665893448725
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,5120,128,0.03240711159176297
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,5120,64,0.025379555092917547
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,5120,32,0.025384000606007043
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,5120,3072,0.13145866658952501
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,4096,51200,0.8012746704949273
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,5120,1536,0.10114222102695042
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,4096,65536,1.0179288652208116
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,4096,16384,0.2861848937140571
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,5120,256,0.027789334456125896
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,4096,12288,0.21634311146206328
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,4096,16384,0.6478115717569987
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,4096,12288,0.48201868269178605
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,4096,10240,0.16782222853766549
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,4096,16384,0.8171164194742838
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,4096,8192,0.14737599425845677
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,4096,10240,0.4051777786678738
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,4096,12288,0.6650915675693089
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,4096,51200,2.1662587059868708
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,4096,7168,0.13126488526662192
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,4096,10240,0.5265866915384928
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,4096,8192,0.3249315685696072
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,4096,7168,0.2848844528198242
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,4096,65536,2.849302291870117
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,4096,7168,0.36533599429660374
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,4096,5120,0.09153155485788982
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,4096,6144,0.2454275555080838
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,4096,4096,0.06621244218614367
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,4096,6144,0.31278933419121635
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,4096,5120,0.20163199636671278
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,4096,5120,0.26661600006951225
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,4096,3584,0.05804710918002658
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,4096,51200,2.4538071950276694
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,4096,4096,0.15762844350602892
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,4096,3072,0.04941244588957893
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,4096,4096,0.20843022399478486
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,4096,65536,3.147715462578667
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,4096,2560,0.043338666359583534
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,4096,3584,0.1389697790145874
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,4096,3584,0.18403644031948516
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,4096,3072,0.11964089340633816
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,4096,2048,0.03601866629388597
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,4096,3072,0.16022311316596136
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,4096,1536,0.02777066661251916
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,4096,2560,0.13869067033131918
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,4096,2560,0.10162488619486491
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,4096,2048,0.08308444420496623
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,4096,1024,0.019946666227446664
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,4096,768,0.015809777710172866
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,4096,1536,0.09377155701319377
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,4096,8192,0.41145777702331543
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,4096,1024,0.04867466621928745
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,4096,1024,0.07221777571572198
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,4096,512,0.01220355596807268
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,4096,768,0.04001955522431268
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,4096,768,0.06083733505672879
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,4096,256,0.009700444837411245
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,4096,512,0.03189599845144484
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,4096,512,0.04846488767200046
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,4096,128,0.008613333106040955
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,4096,256,0.02529866662290361
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,4096,256,0.03732000125779046
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,4096,64,0.007630222373538547
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,4096,128,0.031480001078711614
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,4096,128,0.023034666975339253
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,4096,32,0.00775022225247489
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,4096,64,0.022686221533351477
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,4096,32,0.022635555929607813
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,4096,2048,0.11538844638400608
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,4096,1536,0.06748800145255195
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,3584,51200,0.717448870340983
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,3584,65536,1.1063404083251953
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,3584,16384,0.26494844754536945
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,3584,16384,0.6742071045769585
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,4096,6144,0.10604800118340386
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,3584,12288,0.18416266971164277
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,3584,16384,0.7848755518595377
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,3584,12288,0.4607040087381999
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,3584,10240,0.17609688970777723
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,3584,65536,2.605741288926866
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,3584,51200,2.0533360375298395
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,3584,12288,0.5808577537536621
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,3584,10240,0.385791990492079
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,3584,7168,0.12348177697923447
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,3584,10240,0.4853946897718642
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,3584,8192,0.3102382289038764
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,3584,6144,0.10000533527798122
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,3584,8192,0.3935946623484294
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,3584,7168,0.27185156610276967
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,3584,51200,2.3381849924723306
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,3584,5120,0.08487377564112346
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,3584,7168,0.3478444417317708
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,3584,6144,0.23281065622965494
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,3584,4096,0.06957955492867364
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,3584,3584,0.061879999107784696
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,3584,6144,0.2987448904249403
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,3584,5120,0.1916595564948188
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,3584,4096,0.15017778343624538
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,3584,3072,0.048397332429885864
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,3584,5120,0.2480106618669298
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,3584,2560,0.041413333680894636
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,3584,3584,0.1308257712258233
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,3584,3584,0.1755031082365248
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,3584,8192,0.140754673216078
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,3584,3072,0.113681779967414
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,3584,2048,0.03494044476085239
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,3584,1536,0.024481778343518574
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,3584,2560,0.09701155291663276
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,3584,2560,0.13230933083428278
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,3584,1024,0.018017777138286166
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,3584,2048,0.078712887234158
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,3584,2048,0.11101510789659287
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,3584,768,0.014418666561444601
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,3584,1536,0.06309244367811415
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,3584,1536,0.089264002111223
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,3584,512,0.01204711116022534
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,3584,1024,0.04618577824698555
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,3584,1024,0.06892444690068562
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,3584,256,0.00923822240697013
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,3584,768,0.05833333068423801
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,3584,768,0.03776622149679396
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,3584,128,0.007828444242477417
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,3584,512,0.03026311265097724
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,3584,512,0.04549511273701986
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,3584,64,0.007256000406212277
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,3584,256,0.023702222439977858
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,3584,256,0.036995556619432234
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,3584,32,0.007613333563009898
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,3584,128,0.03071111109521654
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,3584,128,0.02166755497455597
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,3584,65536,2.994244469536675
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,3584,64,0.021271111236678228
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,3584,32,0.02130577796035343
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,3584,4096,0.19828532801734078
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,3072,16384,0.21679288811153838
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,3072,51200,0.6516213417053223
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,3072,65536,0.7596524556477865
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,3072,12288,0.1646560033162435
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,3072,16384,0.5819404390123155
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,3072,12288,0.48900800281100804
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,3072,10240,0.13932711548275417
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,3584,3072,0.15390577581193712
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,3072,12288,0.5747893121507432
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,3072,8192,0.11603466669718425
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,3072,10240,0.3654471238454183
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,3072,10240,0.48363468382093644
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,3072,8192,0.29299643304612905
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,3072,65536,2.411458757188585
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,3072,7168,0.09746399852964614
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,3072,8192,0.39188800917731387
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,3072,51200,2.3227920532226562
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,3072,7168,0.25786399841308594
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,3072,6144,0.07901866568459405
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,3072,7168,0.34538666407267254
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,3072,5120,0.07042755683263142
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,3072,16384,0.8049031363593208
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,3072,6144,0.2212515539593167
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,3072,4096,0.05810844235950046
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,3072,6144,0.29675110181172687
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,3072,5120,0.1821946700414022
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,3072,5120,0.24627465671963164
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,3072,51200,1.8688435024685328
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,3072,65536,2.9770249260796438
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,3072,4096,0.1428782277637058
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,3072,4096,0.19744000169965956
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,3072,3584,0.12422845098707412
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,3072,3584,0.17442754904429117
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,3072,2560,0.03352533446417914
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,3072,3072,0.10742488834593032
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,3072,2048,0.027853333287768896
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,3072,3072,0.15202755398220485
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,3072,1536,0.02130844526820713
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,3072,2560,0.09115288654963176
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,3072,2560,0.13150755564371744
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,3072,2048,0.10946400298012628
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,3072,2048,0.07460355758666992
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,3072,1024,0.015625778171751235
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,3072,768,0.012788444757461548
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,3072,1536,0.05679555733998617
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,3072,1536,0.08760888708962335
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,3072,512,0.01038044442733129
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,3072,1024,0.06792889038721721
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,3072,1024,0.04265955421659681
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,3072,768,0.0354746679464976
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,3072,512,0.04530400037765503
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,3072,512,0.028367999527189467
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,3072,128,0.007302222152551015
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,3072,256,0.022299556268586054
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,3072,256,0.03530933459599813
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,3072,64,0.006591111007663939
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,3072,128,0.02950577934583028
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,3072,128,0.020298666424221463
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,3072,32,0.006614222294754452
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,3072,3584,0.04864889052179125
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,3072,3072,0.03962666789690653
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,3072,32,0.019911999503771465
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,3072,64,0.019876443677478366
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,2560,51200,0.44136712286207413
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,2560,65536,0.6828506787618002
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,2560,16384,0.17339021629757354
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,3072,768,0.05674755573272705
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,2560,12288,0.13124622239006892
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,2560,16384,0.6470906469557021
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,2560,12288,0.4096497694651286
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,2560,10240,0.11116888788011338
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,2560,16384,0.7526524331834582
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,2560,51200,1.7522978252834742
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,2560,8192,0.09279821978674994
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,2560,12288,0.5532693333095974
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,2560,10240,0.3447546694013808
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,3072,256,0.00795999997191959
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,2560,7168,0.0797591143184238
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,2560,65536,2.228439966837565
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,2560,10240,0.4630888832939996
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,2560,6144,0.07350489166047838
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,2560,8192,0.2786826557583279
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,2560,7168,0.24496266576978895
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,2560,5120,0.05961510870191786
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,2560,8192,0.37322399351331925
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,2560,51200,2.2133519914415145
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,2560,6144,0.21005511283874512
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,2560,7168,0.32943110995822483
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,2560,4096,0.048362665706210665
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,2560,3584,0.039107554488711886
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,2560,6144,0.28367556465996635
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,2560,5120,0.17280266020033094
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,2560,3072,0.03402933478355408
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,2560,5120,0.23447910944620767
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,2560,4096,0.13503377967410618
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,2560,3584,0.11846666865878636
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,2560,4096,0.1882542239295112
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,2560,2048,0.025217778152889673
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,2560,3072,0.1022426684697469
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,2560,3072,0.14548356003231472
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,2560,2560,0.08659999900394016
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,2560,1536,0.020201777418454487
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,2560,2560,0.12485510773128933
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,2560,1024,0.015458666616015963
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,2560,2048,0.07040177451239692
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,2560,2048,0.10413866572909886
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,2560,768,0.012786666552225748
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,2560,1536,0.053856889406840004
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,2560,1024,0.06555289030075073
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,2560,1024,0.040250665611690946
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,2560,512,0.009655111365848118
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,2560,768,0.03304355674319797
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,2560,768,0.054177777634726636
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,2560,256,0.007658667034573025
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,2560,512,0.02638133366902669
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,2560,512,0.043046222792731396
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,2560,128,0.006593777901596493
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,2560,256,0.020928889513015747
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,2560,256,0.03394844465785556
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,2560,64,0.0059262220230367445
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,2560,128,0.01923377811908722
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,2560,128,0.02867022156715393
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,2560,32,0.006238222122192383
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,2560,64,0.018535999788178336
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,2560,32,0.018552889426549275
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,2560,2560,0.029370665550231934
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,2560,3584,0.16581688986884222
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,2560,65536,2.8266675737169056
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,2048,65536,0.47949955198499894
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,2560,1536,0.08396177821689182
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,2048,16384,0.14261778195699057
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,2048,16384,0.5125475459628636
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,2048,12288,0.09836000204086304
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,2048,16384,0.7007324430677625
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,2048,12288,0.38812888993157285
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,2048,51200,0.3952337900797526
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,2048,51200,1.6247200436062281
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,2048,10240,0.08871377838982476
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,2048,8192,0.07084177600012885
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,2048,12288,0.5219973458184136
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,2048,65536,2.068910174899631
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,2048,7168,0.06554310851626925
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,2048,10240,0.32606222894456655
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,2048,8192,0.2635635534922282
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,2048,10240,0.437316444185045
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,2048,6144,0.051544000705083214
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,2048,8192,0.35469778378804523
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,2048,7168,0.23186310132344565
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,2048,5120,0.04775644342104594
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,2048,7168,0.3127280076344808
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,2048,51200,2.092920939127604
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,2048,6144,0.19826132721371123
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,2048,4096,0.03812177644835578
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,2048,3584,0.03124177787039015
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,2048,6144,0.2694515652126736
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,2048,5120,0.16348800394270155
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,2048,5120,0.22274578942192924
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,2048,3072,0.02773777809407976
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,2048,65536,2.6781323750813804
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,2048,2560,0.022856889499558344
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,2048,4096,0.1776311132642958
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,2048,3584,0.1113742192586263
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,2048,3584,0.15762133068508571
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,2048,3072,0.09582577811347114
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,2048,3072,0.13785600662231445
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,2048,1536,0.016142222616407607
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,2048,2560,0.11936177147759332
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,2048,2560,0.08114311430189344
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,2048,1024,0.011942221886581846
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,2048,2048,0.068013330300649
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,2048,2048,0.09911733203464085
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,2048,768,0.009921777579519484
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,2048,1536,0.0805600020620558
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,2048,1024,0.05965955389870537
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,2048,512,0.00795288880666097
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,2048,768,0.051190220647388034
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,2048,768,0.03144800000720554
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,2048,256,0.006540444576077991
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,2048,512,0.04215733210245768
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,2048,512,0.025060445070266724
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,2048,128,0.005892444401979446
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,2048,256,0.033257779147889875
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,2048,256,0.01960711181163788
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,2048,64,0.005146666533417172
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,2048,32,0.005212444398138259
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,2048,128,0.027800000376171533
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,2048,128,0.017881777551439073
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,2048,64,0.017501332693629794
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,2048,32,0.01739022301303016
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,2048,4096,0.12707555294036865
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,1536,65536,0.40588800112406415
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,1536,51200,0.3164364496866862
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,2048,2048,0.01975822283162011
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,1536,16384,0.10249600145551895
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,2048,1536,0.0521964430809021
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,2048,1024,0.0369137790468004
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,1536,12288,0.08261333571539985
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,1536,16384,0.48316176732381183
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,1536,10240,0.07388089100519817
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,1536,12288,0.3652186658647325
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,1536,16384,0.6979289054870605
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,1536,12288,0.5172773467169868
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,1536,8192,0.057061334451039634
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,1536,10240,0.30729156070285374
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,1536,7168,0.048680888281928174
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,1536,10240,0.4349813461303711
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,1536,8192,0.24792888429429796
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,1536,51200,1.4984106487698023
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,1536,65536,1.9122418297661676
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,1536,7168,0.21775466865963408
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,1536,8192,0.35314755969577366
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,1536,6144,0.04469511244032118
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,1536,5120,0.036566221051745944
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,1536,4096,0.028169777658250596
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,1536,7168,0.3109075493282742
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,1536,6144,0.185917337735494
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,1536,5120,0.1528115537431505
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,1536,5120,0.22103822231292725
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,1536,6144,0.2673208978441027
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,1536,4096,0.11950222651163737
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,1536,3584,0.02427111069361369
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,1536,3072,0.020908445119857788
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,1536,3584,0.10394489102893406
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,1536,3072,0.09050489134258694
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,1536,2560,0.019679110911157396
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,1536,3072,0.13620266649458143
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,1536,51200,2.077440049913194
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,1536,2048,0.015626667274369132
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,1536,2560,0.11775822109646267
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,1536,65536,2.650367101033529
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,1536,1536,0.01311822235584259
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,1536,2048,0.09882666667302449
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,1536,2048,0.06304355462392171
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,1536,1024,0.010002666877375709
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,1536,1536,0.04885511265860664
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,1536,1536,0.07925066683027479
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,1536,1024,0.034345779154035784
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,1536,1024,0.05923200315899319
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,1536,512,0.007334222396214803
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,1536,768,0.029447111818525527
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,1536,768,0.05033955640263028
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,1536,512,0.023336889015303716
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,1536,256,0.006285333385070165
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,1536,512,0.040272000763151385
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,1536,128,0.005212444398138259
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,1536,256,0.031799111101362444
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,1536,256,0.018202667435010273
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,1536,64,0.004873777843183941
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,1536,128,0.02648888859483931
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,1536,32,0.004857777721352047
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,1536,4096,0.17635911040835908
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,1536,64,0.016153777639071148
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,1536,3584,0.15619644853803846
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,1536,32,0.015814221567577787
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,1536,2560,0.07628977961010404
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,1024,65536,0.29541156027052135
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,1024,51200,0.2331226666768392
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,1024,16384,0.07299466927846272
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,1536,768,0.008683555656009251
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,1024,16384,0.47277243932088214
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,1536,128,0.01648355523745219
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,1024,16384,0.6456061999003092
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,1024,10240,0.04887110988299052
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,1024,12288,0.34818400277031797
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,1024,51200,1.3919280370076497
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,1024,12288,0.49020889070298934
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,1024,10240,0.2872222264607747
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,1024,8192,0.03601422243648105
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,1024,65536,1.7673333485921223
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,1024,7168,0.03420266509056091
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,1024,10240,0.4125608868069119
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,1024,8192,0.23219111230638292
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,1024,7168,0.20351200633578828
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,1024,8192,0.333459562725491
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,1024,7168,0.2946213351355659
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,1024,5120,0.0236791107389662
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,1024,12288,0.05712178018358019
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,1024,51200,1.9644035763210719
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,1024,6144,0.17463555600908068
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,1024,6144,0.2542960113949246
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,1024,5120,0.14301244417826334
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,1024,3584,0.017636444833543565
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,1024,4096,0.1110195583767361
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,1024,4096,0.16740443971421984
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,1024,3072,0.015227556228637695
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,1024,3584,0.09655555751588608
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,1024,3584,0.14766577879587808
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,1024,2560,0.013931555880440606
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,1024,3072,0.08399022287792629
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,1024,3072,0.12924444675445557
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,1024,2048,0.011751111182901593
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,1024,2560,0.07108533382415771
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,1024,2560,0.1120248900519477
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,1024,1536,0.009708444277445475
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,1024,2048,0.0932568907737732
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,1024,2048,0.05812622441185845
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,1024,1024,0.00794488853878445
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,1024,1536,0.04419377777311537
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,1024,6144,0.02806666824552748
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,1024,768,0.006976000136799282
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,1024,1024,0.03206933206982083
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,1024,512,0.005657777604129579
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,1024,768,0.027141332626342773
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,1024,768,0.04827288786570231
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,1024,256,0.004751111070315043
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,1024,4096,0.01938666734430525
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,1024,512,0.021765333082940843
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,1024,512,0.03907555672857497
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,1024,128,0.004219555606444676
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,1024,256,0.017024889588356018
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,1024,256,0.030478222502602473
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,1024,5120,0.20965866247812906
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,1024,64,0.0038951109680864546
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,1024,128,0.026047110557556152
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,1024,32,0.0038906666967603895
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,1024,65536,2.5044053395589194
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,1024,128,0.014879110786649915
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,1024,64,0.01479555500878228
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,1024,32,0.014440889159838358
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,768,65536,0.2444737752278646
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,768,51200,0.19335911009046766
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,768,16384,0.06617066595289442
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,1024,1536,0.0754400028122796
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,1024,1024,0.05676888757281833
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,768,12288,0.04792444573508369
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,768,16384,0.4472186830308702
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,768,12288,0.3332284556494819
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,768,10240,0.039750221702787615
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,768,12288,0.4940515624152289
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,768,51200,1.347876442803277
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,768,8192,0.030850665436850652
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,768,10240,0.27990134557088214
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,768,65536,1.719361729092068
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,768,7168,0.02754488918516371
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,768,8192,0.22574488321940103
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,768,10240,0.40999288029140896
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,768,6144,0.023411555422676936
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,768,8192,0.331965340508355
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,768,7168,0.19768177138434517
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,768,5120,0.020261334048377145
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,768,7168,0.29264354705810547
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,768,51200,1.9595902760823567
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,768,6144,0.16966044902801514
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,768,4096,0.01704088846842448
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,768,6144,0.25302667087978786
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,768,5120,0.13934489091237387
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,768,3584,0.015441776977645027
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,768,16384,0.6420719888475206
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,768,4096,0.10809155305226643
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,768,3072,0.01364177796575758
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,768,4096,0.16653954982757568
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,768,2560,0.011735999749766456
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,768,3584,0.09379555781682332
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,768,3584,0.1475671132405599
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,768,2048,0.010334221853150262
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,768,3072,0.1292924483617147
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,768,2560,0.06942400005128649
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,768,2560,0.11179644531673855
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,768,1536,0.008376888930797577
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,768,2048,0.056002669864230685
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,768,2048,0.09284977780448066
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,768,1024,0.007277333074145847
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,768,1536,0.07384800248675875
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,768,1536,0.04359289010365804
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,768,768,0.00656088896923595
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,768,512,0.005543111099137201
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,768,1024,0.03115644388728672
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,768,1024,0.05600533220503065
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,768,256,0.004546666724814309
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,768,768,0.026643556025293138
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,768,768,0.04769777920511034
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,768,512,0.038615110847685076
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,768,128,0.004210666649871402
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,768,256,0.03085244364208645
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,768,256,0.016149333781666227
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,768,64,0.003657777690225177
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,768,128,0.014494222071435718
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,768,32,0.0038897775941424896
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,768,64,0.014105778601434497
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,768,65536,2.497694227430556
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,768,32,0.014057776994175382
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,512,65536,0.18067733446756998
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,512,51200,0.1393671168221368
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,768,3072,0.0814337796635098
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,512,16384,0.04376533296373156
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,512,16384,0.4201333257887099
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,768,512,0.02127200033929613
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,512,12288,0.031758222315046526
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,768,128,0.025748444928063288
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,768,5120,0.20822578006320527
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,512,10240,0.025791999366548326
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,512,12288,0.3187493218315972
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,512,51200,1.290801790025499
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,512,8192,0.020599111914634705
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,512,16384,0.6073999934726292
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,512,12288,0.4606169064839681
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,512,65536,1.6457555558946397
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,512,7168,0.018160889546076458
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,512,10240,0.2674373255835639
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,512,6144,0.01607822212908003
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,512,8192,0.21601333883073595
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,512,10240,0.3875324461195204
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,512,5120,0.013904889424641928
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,512,8192,0.3141760031382243
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,512,7168,0.18992088900672066
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,512,7168,0.27740976545545787
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,512,4096,0.011586666935020022
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,512,6144,0.16257866223653158
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,512,51200,1.844879150390625
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,512,3584,0.01072622256146537
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,512,6144,0.23925778600904676
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,512,5120,0.133389327261183
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,512,3072,0.009504888620641496
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,512,5120,0.19734844896528456
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,512,4096,0.10314666562610203
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,512,2560,0.00851288851764467
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,512,3584,0.08929866552352905
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,512,3584,0.13945510652330187
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,512,65536,2.3570132785373263
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,512,3072,0.0771520005332099
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,512,2048,0.0073315559162033936
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,512,3072,0.12164889441596137
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,512,1536,0.006264888991912206
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,512,2560,0.06475733386145698
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,512,2560,0.10504711336559719
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,512,1024,0.005393777870469623
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,512,2048,0.08808088964886135
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,512,2048,0.052314665582444936
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,512,1536,0.041441778341929116
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,512,1536,0.06888444556130303
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,512,768,0.004876444323195351
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,512,512,0.004233777936961916
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,512,1024,0.02964622113439772
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,512,1024,0.05317244595951504
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,512,256,0.0038524443904558816
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,512,768,0.0452551113234626
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,512,768,0.025359110699759588
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,512,512,0.020234665936893888
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,512,128,0.00378222225440873
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,512,64,0.003302222324742211
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,512,256,0.029105779197480943
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,512,256,0.015464888678656684
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,512,128,0.02405244443151686
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,512,32,0.003540444291300244
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,512,128,0.0136835558546914
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,512,64,0.013396444420019785
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,256,65536,0.10159911049736871
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,512,32,0.013064888616402945
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,256,51200,0.08577422300974528
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,256,16384,0.03170133299297757
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,512,4096,0.15741954909430608
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,256,16384,0.40928178363376194
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,256,12288,0.024872000018755596
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,512,512,0.036561777194341026
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,256,16384,0.6027288966708714
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,256,12288,0.3094835546281603
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,256,51200,1.2494755850897896
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,256,65536,1.596570650736491
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,256,10240,0.2601777712504069
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,256,12288,0.4572399987114801
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,256,8192,0.017344888713624742
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,256,7168,0.015499555402331881
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,256,10240,0.38484978675842285
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,256,8192,0.2098888953526815
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,256,6144,0.01333688861793942
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,256,51200,1.834140353732639
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,256,7168,0.18456621964772543
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,256,5120,0.012048888537618848
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,256,7168,0.27519912189907497
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,256,6144,0.15794400374094644
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,256,5120,0.12923999627431235
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,256,6144,0.23778133922153047
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,256,65536,2.3385236528184676
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,256,5120,0.19578399923112658
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,256,3584,0.008269333177142674
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,256,3072,0.007276444799370236
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,256,10240,0.020925333102544148
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,256,4096,0.10043288601769342
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,256,4096,0.15602933035956487
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,256,2560,0.006671111202902264
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,256,3584,0.13817777898576525
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,256,3584,0.08632266521453857
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,256,3072,0.07513333029217191
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,256,2048,0.006220444622966979
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,256,3072,0.12064533763461643
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,256,1536,0.0052177777720822235
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,256,2560,0.10422666867574056
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,256,2048,0.050275554259618126
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,256,2048,0.08687822024027507
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,256,1536,0.06768977642059326
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,256,768,0.0042160000238153665
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,256,1024,0.0284862220287323
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,256,768,0.024341333243581984
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,256,512,0.0038559999730851916
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,256,8192,0.3114986684587267
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,256,512,0.01960711181163788
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,256,512,0.036222222778532244
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,256,256,0.003489777859714296
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,256,4096,0.008998221821255153
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,256,128,0.00318755561278926
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,256,256,0.02826489011446635
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,256,256,0.01482222146458096
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,256,64,0.002887111157178879
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,256,128,0.01311644415060679
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,256,128,0.023694222172101338
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,256,32,0.00318755561278926
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,256,64,0.012768000364303589
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,128,65536,0.07719822062386407
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,256,32,0.012431110772821637
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,256,2560,0.06341599755816989
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,128,51200,0.06281066603130765
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,256,1024,0.004564444637960858
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,256,1536,0.038966221941841975
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,128,16384,0.026782222919993933
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,256,1024,0.052367998494042285
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,256,768,0.0453342232439253
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,128,12288,0.01793866687350803
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,128,16384,0.39905156029595273
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,128,16384,0.6004906760321723
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,128,10240,0.0155404441886478
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,128,12288,0.30206312073601616
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,128,12288,0.4563342200385199
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,128,8192,0.013177778157922955
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,128,10240,0.2538204458024767
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,128,51200,1.2178017298380535
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,128,7168,0.012105777859687805
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,128,10240,0.38368977440728086
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,128,65536,1.5568248960706923
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,128,6144,0.010688888529936472
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,128,8192,0.20505689250098336
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,128,7168,0.1799724499384562
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,128,8192,0.3108924494849311
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,128,5120,0.009465778039561378
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,128,7168,0.27402488390604657
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,128,6144,0.15429777569240993
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,128,4096,0.008009778128729926
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,128,6144,0.23686665958828398
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,128,51200,1.829180399576823
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,128,3584,0.007608888877762689
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,128,5120,0.1258995532989502
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,128,5120,0.19482489426930746
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,128,4096,0.09728178050782944
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,128,4096,0.15540088547600642
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,128,2560,0.006241777704821692
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,128,3584,0.08410222000545925
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,128,3584,0.13762222396002874
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,128,65536,2.3335111406114364
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,128,3072,0.07234044207466973
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,128,3072,0.11972267097896999
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,128,1536,0.004928888960017098
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,128,2560,0.061405334207746715
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,128,2560,0.10333155261145698
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,128,1024,0.004242666479614046
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,128,2048,0.08708355824152629
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,128,2048,0.04935288760397169
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,128,768,0.003846222327815162
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,128,1536,0.0674275557200114
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,128,1536,0.03820711043145921
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,128,512,0.0035333335399627686
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,128,1024,0.05243644449445936
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,128,1024,0.027775110469924078
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,128,256,0.0033448889023727844
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,128,768,0.023904000719388325
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,128,768,0.0447617769241333
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,128,128,0.0028906667398081887
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,128,512,0.019167110323905945
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,128,512,0.03609866566128201
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,128,64,0.0028702221396896574
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,128,256,0.014448889427714877
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,128,32,0.003173333282272021
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,128,128,0.01239911135700014
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,128,128,0.02330400049686432
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,128,64,0.01238844460911221
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,64,65536,0.07146666447321574
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,128,32,0.012049777640236748
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,64,51200,0.0580000016424391
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,64,16384,0.0233608881632487
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,64,12288,0.014152889450391134
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,128,3072,0.0069013333155049225
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,64,10240,0.012468444804350534
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,64,8192,0.010563555690977307
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,128,2048,0.005561777700980504
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,64,7168,0.010799110763602786
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,64,12288,0.3016471068064372
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,64,10240,0.2531742254892985
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,64,6144,0.010230222509966956
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,64,16384,0.3979315492841933
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,64,8192,0.20471555656856963
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,64,5120,0.008968888885445064
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,64,4096,0.007616000043021307
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,64,3584,0.007269333634111617
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,64,7168,0.17991911040412056
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,64,6144,0.15345244937472874
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,64,5120,0.12589066558414036
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,64,3072,0.006587555425034628
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,64,2560,0.005886222339338726
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,64,3584,0.08409955766465928
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,64,2048,0.005196444276306364
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,64,1536,0.004852444347408083
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3328,128,256,0.02776977750990126
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,64,3072,0.07260444429185656
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,64,2560,0.061342219511667885
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,64,1024,0.004192000048028098
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,64,768,0.0038684445122877755
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,64,512,0.0032915555768542816
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,64,1536,0.03836799992455377
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,64,256,0.0034008889148632684
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,64,51200,1.2185822592841256
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,64,1024,0.027863999207814533
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,64,768,0.023583999938435022
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,64,128,0.0028195555011431375
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,64,64,0.0028213332924577924
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,64,512,0.01889866590499878
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,64,32,0.0032008888406885993
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,64,256,0.014440889159838358
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,64,128,0.012418666647540199
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,64,65536,1.556460486518012
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,64,64,0.01183111137813992
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,64,32,0.011731555892361535
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,32,51200,0.05899910794364082
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,32,16384,0.022974222898483276
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,32,12288,0.011037333144081963
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,32,12288,0.3019084400600857
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,32,16384,0.3982231087154812
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,64,4096,0.09668444262610541
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,32,10240,0.01035288886891471
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,32,8192,0.00903555585278405
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,32,7168,0.009668444593747457
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,64,2048,0.04829333225886027
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,32,10240,0.2531155480278863
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,32,6144,0.008989333278603023
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,32,8192,0.20472089449564615
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,32,5120,0.011006222003036074
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,32,4096,0.009357333183288574
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,32,5120,0.12593689229753283
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,32,6144,0.15375022093454996
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,32,65536,0.07630133628845215
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,32,3584,0.008957333034939235
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,32,4096,0.0969546635945638
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,32,3072,0.007777777810891469
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,32,2560,0.0069644442862934535
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,32,2048,0.005413333161009683
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,32,3584,0.08415644698672825
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,32,3072,0.07307289044062297
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,32,2560,0.061117331186930336
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,32,1536,0.004580444345871608
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,32,65536,1.555827564663357
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,32,1024,0.0038577777643998465
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,32,2048,0.04803644286261665
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,32,768,0.0038364442686239877
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,32,512,0.003504000190231535
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,32,256,0.0031973332580592898
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,32,1536,0.03793688946300083
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,32,1024,0.027592889136738245
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,32,768,0.023983110984166462
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,32,128,0.0028204443968004654
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,32,512,0.018971555762820773
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,32,64,0.0028213332924577924
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,32,256,0.014158222410413953
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,32,128,0.012406222522258759
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,32,64,0.012230222423871359
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,32,32,0.012075555821259817
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,32,7168,0.17957154909769693
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3328,32,51200,1.2182800504896376
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3328,32,32,0.002826666666401757
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,65536,12288,3.0408462948269315
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,65536,10240,2.865443547566732
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,65536,16384,3.7587610880533853
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,65536,12288,3.4956160651312937
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,65536,10240,2.7373085021972656
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,65536,16384,4.676152123345269
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,65536,8192,2.1507786644829645
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,65536,6144,1.5767884784274633
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,65536,7168,1.8881414201524522
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,65536,7168,1.8607368469238281
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,65536,8192,2.162033716837565
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,65536,6144,1.5525582631429036
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,65536,5120,1.3314861721462674
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,65536,4096,1.0695884492662218
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,65536,3584,0.907342274983724
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,65536,4096,1.0327431360880535
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,65536,5120,1.3000213834974501
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,65536,3072,0.7577946450975207
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,65536,3584,0.898864852057563
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,65536,2560,0.6928470929463705
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,65536,2048,0.48931466208563906
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,65536,3072,0.8180426491631402
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,65536,2560,0.6600560082329644
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,65536,1536,0.35243911213344997
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,65536,1024,0.2694586647881402
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,65536,768,0.19070311387379965
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,65536,512,0.15567378203074136
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,65536,1024,0.32534223132663304
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,65536,1536,0.5450995763142904
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,65536,768,0.27537067731221515
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,65536,256,0.11923910511864556
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,65536,512,0.21738133165571424
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,65536,128,0.09694221946928237
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,65536,64,0.08221066660351224
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,65536,32,0.08744711346096462
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,65536,256,0.19231732686360678
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,65536,128,0.18646489249335396
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,65536,64,0.1842879984113905
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,65536,32,0.19276711675855848
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,65536,2048,0.5649111005995009
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,51200,16384,2.9750258127848306
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,65536,51200,12.165577358669706
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,51200,16384,3.741685231526693
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,51200,12288,2.2668880886501737
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,51200,12288,2.673071119520399
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,51200,10240,1.9435147179497614
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,51200,10240,2.1865857442220054
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,51200,8192,1.5430222617255316
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,51200,8192,1.6999698215060766
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,51200,7168,1.304016007317437
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,51200,51200,9.343631320529514
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,51200,6144,1.0940382215711806
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,51200,7168,1.4932862387763128
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,51200,5120,0.9721750683254666
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,51200,5120,1.0591164694892037
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,51200,6144,1.2607475916544597
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,65536,51200,20.01947699652778
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,51200,4096,0.7523075739542643
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,51200,4096,0.8450729052225748
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,51200,3584,0.705633799235026
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,51200,65536,12.191197713216146
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,51200,3584,0.7458711200290256
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,51200,3072,0.6068453258938259
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,51200,2560,0.5710479948255751
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,51200,3072,0.6271004676818848
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,51200,2048,0.38961511188083225
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,51200,1536,0.3653137683868408
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,51200,2048,0.4708417786492242
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,51200,1024,0.2209564447402954
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,51200,1536,0.34152889251708984
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,51200,768,0.17833599779340956
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,51200,512,0.13596977127922907
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,51200,2560,0.5463351143731011
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,51200,768,0.20492355028788248
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,51200,256,0.09197955661349827
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,51200,128,0.0690222250090705
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,51200,1024,0.36291199260287815
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,51200,64,0.06020355224609375
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,51200,512,0.1744133366478814
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,51200,32,0.06400622261895074
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,51200,128,0.14567911624908447
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,51200,64,0.14813333087497288
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,51200,256,0.15712089008755153
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,51200,32,0.14987288581000432
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,16384,16384,1.105696890089247
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,16384,16384,1.3907626469930012
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,16384,12288,0.8181573549906412
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,51200,51200,15.894678751627604
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,16384,10240,0.6490657594468858
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,16384,51200,2.972858640882704
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,16384,12288,1.0117004182603624
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,16384,10240,0.8692435688442655
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,16384,8192,0.5949084493849013
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,16384,7168,0.4633297920227051
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,16384,65536,4.005547417534722
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,16384,8192,0.6810391214158801
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,16384,6144,0.45541069242689347
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,16384,7168,0.5844720204671224
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,16384,6144,0.5646142429775661
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,16384,5120,0.34498932626512313
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,16384,4096,0.30712445576985675
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,16384,5120,0.41024621327718097
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,16384,3584,0.22968710793389213
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,16384,4096,0.32483821445041233
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,16384,3072,0.23051555951436362
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,16384,2560,0.1615013281504313
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,16384,3584,0.35888089074028867
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,16384,3072,0.24640443589952257
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,16384,2048,0.1582826640870836
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,16384,1536,0.10575022300084432
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,16384,2560,0.210171553823683
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,16384,1024,0.08840622504552205
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,16384,2048,0.1954417758517795
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,16384,768,0.06217510832680596
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,16384,1536,0.1373751163482666
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,16384,512,0.04325777623388502
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,16384,256,0.03126222226354811
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,16384,1024,0.12138488557603623
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,16384,768,0.09541955259111191
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,16384,128,0.025041777226659987
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,16384,512,0.0703502231174045
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,16384,64,0.02418577836619483
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,16384,256,0.06198933389451769
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,16384,32,0.025175111161337957
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,16384,128,0.05739021963543362
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,16384,64,0.05706933471891615
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,16384,32,0.062408890989091664
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,16384,51200,5.696419609917535
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,51200,65536,19.92042711046007
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,12288,16384,0.7425448629591199
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,12288,12288,0.5490364498562282
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,16384,65536,6.849808163113064
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,12288,16384,1.1574630737304688
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,12288,12288,0.884394645690918
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,12288,10240,0.5721911324395074
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,12288,8192,0.3752675586276584
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,12288,10240,0.7060942120022244
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,12288,51200,2.4188550313313804
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,12288,7168,0.37702488899230957
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,12288,8192,0.5509289105733236
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,12288,7168,0.5102888743082682
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,12288,5120,0.24580266740587023
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,12288,65536,2.998363494873047
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,12288,6144,0.4568382369147406
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,12288,4096,0.18660355938805473
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,12288,5120,0.33672889073689777
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,12288,3584,0.1998088889651828
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,12288,4096,0.27828534444173175
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,12288,3072,0.13308621777428523
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,12288,3584,0.23904000388251412
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,12288,2048,0.10029777553346421
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,12288,3072,0.20177600118849012
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,12288,2560,0.13563377327389187
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,12288,1536,0.07639022005928887
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,12288,2560,0.17672533459133574
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,12288,1024,0.054189334313074745
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,12288,1536,0.13103644053141275
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,12288,2048,0.14335555500454372
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,12288,512,0.03262666530079312
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,12288,6144,0.2824453247918023
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,12288,768,0.07134399811426799
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,12288,256,0.02437866727511088
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,12288,1024,0.08574844731224908
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,12288,128,0.01998666591114468
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,12288,512,0.05845333470238579
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,12288,64,0.0177839994430542
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,12288,32,0.018048889107174344
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,12288,128,0.045775112178590566
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,12288,64,0.04532177911864387
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,12288,32,0.045216000742382474
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,12288,51200,4.323458777533637
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,12288,768,0.04085866610209147
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,12288,256,0.05071111188994514
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,10240,16384,0.6188080045912001
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,12288,65536,5.843889872233073
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,10240,12288,0.4608124627007379
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,10240,10240,0.4429057704077826
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,10240,51200,2.0292676289876304
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,10240,16384,0.9952258004082574
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,10240,12288,0.7892710897657605
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,10240,65536,2.426344977484809
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,10240,8192,0.38730843861897785
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,10240,10240,0.6518666479322646
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,10240,7168,0.29010044203864205
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,10240,6144,0.2763893339369032
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,10240,5120,0.20545244216918945
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,10240,7168,0.42871999740600586
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,10240,4096,0.16506932841406927
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,10240,5120,0.32504532072279185
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,10240,6144,0.4320533275604248
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,10240,3584,0.14212800396813288
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,10240,3072,0.12136356035868327
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,10240,4096,0.24543823136223686
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,10240,2560,0.1021253334151374
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,10240,2048,0.08802488777372573
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,10240,3584,0.23630221684773764
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,10240,3072,0.19626755184597441
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,10240,1536,0.06346844302283393
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,10240,1024,0.04864355590608385
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,10240,2560,0.15495733420054117
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,10240,768,0.038322667280832924
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,10240,1536,0.10448710785971747
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,10240,512,0.02863022353914049
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,10240,1024,0.07836977640787761
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,10240,256,0.02097333305411869
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,10240,768,0.062032891644371875
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,10240,128,0.017438222964604694
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,10240,64,0.014886221951908536
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,10240,512,0.05197599861356947
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,10240,256,0.042598221037122935
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,10240,32,0.015108444624476962
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,10240,128,0.0377146667904324
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,10240,64,0.037802666425704956
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,10240,8192,0.5350293583340114
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,10240,32,0.03774311145146688
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,10240,51200,3.85114754570855
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,8192,16384,0.48102309968736434
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,10240,2048,0.12976800070868597
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,8192,12288,0.396578656302558
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,10240,65536,5.024101257324219
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,8192,16384,0.8698897891574435
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,8192,10240,0.31519556045532227
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,8192,12288,0.6378835572136773
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,8192,51200,1.5178053114149306
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,8192,8192,0.24026311768425834
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,8192,7168,0.21683911482493082
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,8192,10240,0.570266670650906
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,8192,65536,1.9327990214029949
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,8192,5120,0.16686311033036974
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,8192,8192,0.4520950847201877
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,8192,7168,0.4122622278001573
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,8192,4096,0.1317360003789266
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,8192,6144,0.3168959882524279
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,8192,3584,0.11952088938819037
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,8192,5120,0.28045156266954213
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,8192,3072,0.10480622450510661
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,8192,4096,0.20809243785010445
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,8192,2560,0.08189777533213298
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,8192,2048,0.07335378064049615
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,8192,3584,0.18982577323913574
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,8192,3072,0.16050044695536295
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,8192,1536,0.052799999713897705
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,8192,2560,0.1347635587056478
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,8192,1024,0.0361422234111362
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,8192,768,0.027655111418830022
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,8192,2048,0.11413244406382243
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,8192,512,0.021309332715140447
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,8192,1536,0.09212533632914226
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,8192,256,0.017424000634087455
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,8192,768,0.05390933487150404
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,8192,512,0.043790221214294434
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,8192,256,0.035262223747041486
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,8192,6144,0.20149600505828857
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,8192,64,0.012159110771285163
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,8192,128,0.03277066681120131
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,8192,32,0.012392889294359418
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,8192,64,0.0322017769018809
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,8192,51200,3.1141866048177085
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,8192,32,0.03188800149493747
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,8192,1024,0.06753422154320611
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,8192,65536,4.180120680067274
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,8192,128,0.013707555830478668
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,7168,12288,0.3218302196926541
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,7168,16384,0.44770489798651797
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,7168,51200,1.3700692918565538
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,7168,10240,0.31147556834750706
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,7168,65536,1.8437716166178386
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,7168,16384,0.8178888956705729
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,7168,8192,0.2519902123345269
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,7168,12288,0.613809797498915
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,7168,7168,0.21030578348371717
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,7168,10240,0.5273911158243815
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,7168,6144,0.17193688286675346
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,7168,8192,0.4204897880554199
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,7168,5120,0.14361333847045898
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,7168,4096,0.10899644427829319
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,7168,6144,0.29542578591240776
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,7168,3584,0.09393955601586236
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,7168,4096,0.19610488414764404
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,7168,3072,0.0932026637925042
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,7168,2560,0.0736115574836731
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,7168,3584,0.16665866639879015
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,7168,2048,0.056707554393344455
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,7168,3072,0.14653600586785212
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,7168,1536,0.04778755704561869
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,7168,2560,0.12771466043260363
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,7168,1024,0.03257688879966736
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,7168,768,0.023941333095232647
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,7168,51200,2.868864059448242
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,7168,2048,0.10405421919292873
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,7168,512,0.0184551113181644
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,7168,1536,0.08278577857547335
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,7168,256,0.01484266585773892
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,7168,1024,0.06168444289101494
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,7168,128,0.013433777623706393
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,7168,768,0.04965333475006951
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,7168,64,0.011398221883508893
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,7168,512,0.04031377699640062
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,7168,256,0.03275022241804335
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,7168,32,0.013005333642164866
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,7168,128,0.030024889442655776
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,7168,64,0.02979466650221083
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,7168,32,0.029291556941138372
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,7168,65536,3.655096689860026
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,7168,7168,0.39774399333530003
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,7168,5120,0.245011568069458
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,6144,16384,0.38095821274651426
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,6144,12288,0.2896328767140706
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,6144,10240,0.22903643714057076
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,6144,8192,0.18615021970536974
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,6144,12288,0.544091542561849
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,6144,16384,0.7346613142225477
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,6144,10240,0.4820355309380426
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,6144,51200,1.2745929294162326
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,6144,7168,0.1708079973856608
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,6144,6144,0.1444551150004069
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,6144,5120,0.13876267274220785
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,6144,8192,0.3935191101498074
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,6144,65536,1.665172470940484
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,6144,7168,0.31895555390252006
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,6144,4096,0.11112266116672093
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,6144,6144,0.32524000273810494
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,6144,3584,0.11852622032165527
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,6144,5120,0.2321875625186496
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,6144,4096,0.17858044306437174
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,6144,2560,0.0878408882353041
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,6144,3584,0.15389866299099392
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,6144,2048,0.057667553424835205
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,6144,1536,0.041231112347708807
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,6144,3072,0.146415114402771
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,6144,1024,0.026851556367344324
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,6144,2560,0.11708445019192165
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,6144,768,0.023120888405376013
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,6144,2048,0.1231973303688897
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,6144,512,0.01704355577627818
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,6144,1536,0.07787377966774835
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,6144,256,0.015535111228624979
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,6144,1024,0.0570346646838718
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,6144,128,0.011316444310877057
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,6144,768,0.04603200157483419
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,6144,64,0.00980177770058314
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,6144,512,0.042966223425335355
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,6144,32,0.009834667046864828
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,6144,256,0.029551111989551123
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,6144,128,0.027781334188249376
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,6144,64,0.027429333991474573
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,6144,32,0.02776799930466546
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,6144,51200,2.5533165401882596
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,5120,16384,0.31503023041619194
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,6144,3072,0.08374400271309747
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,5120,12288,0.23338399993048775
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,6144,65536,3.461433834499783
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,5120,16384,0.6670097774929471
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,5120,51200,0.9919875462849935
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,5120,65536,1.2668630811903212
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,5120,10240,0.20815732744004992
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,5120,8192,0.1825608942243788
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,5120,12288,0.5466560257805718
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,5120,7168,0.13946755727132162
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,5120,10240,0.415117343266805
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,5120,6144,0.11949955092536078
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,5120,5120,0.09683199723561604
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,5120,8192,0.3676755428314209
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,5120,7168,0.35495466656155056
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,5120,4096,0.07635288768344455
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,5120,6144,0.262480894724528
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,5120,3584,0.08351644542482163
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,5120,5120,0.2109146647983127
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,5120,3072,0.06372800138261583
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,5120,4096,0.165775113635593
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,5120,3584,0.14136444197760686
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,5120,2048,0.04378222094641792
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,5120,3072,0.1345920032925076
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,5120,1536,0.03524000114864773
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,5120,2560,0.10736088620291816
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,5120,1024,0.02568799919552273
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,5120,768,0.020783111453056335
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,5120,1536,0.0720977783203125
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,5120,51200,2.2855023278130426
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,5120,512,0.016473778420024447
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,5120,768,0.04226311047871908
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,5120,256,0.012099555797047086
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,5120,128,0.01034400032626258
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,5120,512,0.033923556407292686
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,5120,256,0.027149332894219294
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,5120,64,0.008985777695973715
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,5120,128,0.024901333782407973
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,5120,32,0.009185777770148383
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,5120,64,0.024689777029885188
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,5120,32,0.024354666471481323
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,5120,65536,2.9654443528917103
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,5120,2560,0.05061422122849358
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,5120,2048,0.08866310781902736
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,4096,16384,0.2631466653611925
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,5120,1024,0.05118311113781399
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,4096,65536,0.9295226203070747
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,4096,51200,0.8023262023925781
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,4096,12288,0.19500799973805746
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,4096,10240,0.18551554944780138
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,4096,8192,0.14423910776774088
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,4096,7168,0.13983110586802164
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,4096,16384,0.5998302035861546
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,4096,12288,0.4521999888949924
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,4096,6144,0.11788711282942031
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,4096,7168,0.26753422949049205
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,4096,10240,0.48012802335951066
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,4096,5120,0.08295022116767035
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,4096,4096,0.06798488563961454
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,4096,3584,0.056186669402652316
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,4096,3072,0.050028443336486816
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,4096,6144,0.22684711880154082
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,4096,5120,0.21063555611504448
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,4096,4096,0.15103288491566977
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,4096,2560,0.04298399885495504
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,4096,2048,0.03536355495452881
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,4096,3584,0.1286826663547092
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,4096,1536,0.027424888478385076
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,4096,3072,0.11241155200534397
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,4096,1024,0.020131554868486192
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,4096,2560,0.10147111283408271
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,4096,2048,0.07820000251134236
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,4096,768,0.01647555496957567
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,4096,512,0.011843555503421359
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,4096,1536,0.06288088692559136
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,4096,256,0.009481777747472128
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,4096,1024,0.04595288965437147
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,4096,128,0.008332444561852349
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,4096,768,0.03942222065395779
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,4096,512,0.030040889978408813
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,4096,64,0.007292444507280986
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,4096,51200,2.0731343163384333
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,4096,256,0.024021334118313257
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,4096,32,0.00776622196038564
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,4096,128,0.022335999541812476
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,4096,32,0.021993777818149988
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,4096,64,0.022892443670166865
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,4096,8192,0.31623199250963
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,4096,65536,2.5965360005696616
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,3584,16384,0.22302044762505424
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,3584,12288,0.17705510722266304
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,3584,10240,0.16332266065809461
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,3584,8192,0.13249599933624268
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,3584,51200,0.7201742066277398
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,3584,16384,0.5702364179823134
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,3584,65536,0.861220465766059
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,3584,12288,0.4287395477294922
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,3584,10240,0.36101778348286945
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,3584,5120,0.07729422383838229
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,3584,8192,0.2949742211235894
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,3584,7168,0.25301067034403485
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,3584,4096,0.06230311261283027
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,3584,6144,0.21563288900587294
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,3584,3584,0.05307822095023262
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,3584,5120,0.17802045080396864
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,3584,3072,0.05111822154786852
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,3584,4096,0.13926133844587538
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,3584,2560,0.0402728882100847
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,3584,3584,0.12245689498053657
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,3584,2048,0.030934221214718286
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,3584,3072,0.10629689031177098
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,3584,1536,0.024674667252434626
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,3584,2560,0.09059466918309529
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,3584,1024,0.01703733371363746
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,3584,2048,0.07351555426915486
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,3584,768,0.013973333769374423
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,3584,51200,1.921145757039388
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,3584,1536,0.059176001283857554
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,3584,512,0.011759999725553723
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,3584,1024,0.043450666798485645
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,3584,256,0.00906133320596483
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,3584,7168,0.12847199704911974
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,3584,128,0.00795377790927887
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,3584,6144,0.10319555468029445
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,3584,512,0.028392000330819026
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,3584,64,0.007142222589916653
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,3584,32,0.007688889073001013
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,3584,128,0.021165332860416834
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,3584,65536,2.4454292721218533
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,3584,32,0.020630222227838304
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,3584,64,0.020956445071432326
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,3072,16384,0.2201519939634535
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,3072,51200,0.6441546546088325
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,3072,65536,0.8342000113593208
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,3072,12288,0.1798106696870592
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,3072,16384,0.5440933439466689
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,3584,768,0.03636799918280707
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,3072,10240,0.13784444332122803
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,3584,256,0.023077333966890972
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,3072,8192,0.09800710943010117
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,3072,12288,0.4459226926167806
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,3072,7168,0.09042488866382176
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,3072,10240,0.3402764532301161
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,3072,6144,0.07816977633370294
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,3072,7168,0.2400595611996121
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,3072,5120,0.06496800316704644
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,3072,8192,0.31932356622484
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,3072,4096,0.050599998897976346
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,3072,6144,0.20397778352101645
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,3072,3584,0.052616000175476074
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,3072,3072,0.03861155443721347
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,3072,2560,0.03943999939494663
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,3072,2048,0.029511110650168523
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,3072,4096,0.13172266218397352
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,3072,51200,1.7472506629096136
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,3072,3584,0.11636711491478814
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,3072,3072,0.10048266914155747
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,3072,2560,0.08557422293557061
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,3072,1024,0.01758577757411533
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,3072,768,0.014505777094099255
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,3072,2048,0.07077955537372164
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,3072,512,0.011699555648697747
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,3072,256,0.009000889129108852
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,3072,1024,0.04079200161827935
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,3072,768,0.03328355484538608
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,3072,65536,2.2390889061821833
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,3072,512,0.02685866587691837
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,3072,256,0.02167644434505039
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,3072,64,0.007479999628331926
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,3072,128,0.01995022263791826
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,3072,64,0.01959733333852556
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,3072,32,0.019542222221692402
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,2560,51200,0.45658667882283527
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,3072,5120,0.17249243789248994
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,3072,1536,0.023278221487998962
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,2560,16384,0.1573759979671902
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,2560,12288,0.12193332778082953
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,3072,128,0.00830488900343577
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,2560,10240,0.09261155790752834
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,3072,32,0.007884444461928474
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,2560,8192,0.07706133524576823
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,2560,12288,0.38558043373955625
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,2560,7168,0.0714026689529419
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,2560,10240,0.32127732700771755
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,2560,8192,0.2594133218129476
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,2560,65536,0.6195395787556967
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,2560,5120,0.047338667843076915
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,2560,6144,0.19360444280836317
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,2560,4096,0.03991644581158956
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,2560,65536,2.0835083855523004
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,3072,1536,0.05398133397102356
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,2560,5120,0.15917866759830052
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,2560,3584,0.03920266694492764
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,2560,3072,0.03469511204295688
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,2560,51200,1.6325857374403212
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,2560,4096,0.12490310933854844
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,2560,2560,0.029353777567545574
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,2560,2048,0.024900444679790076
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,2560,3584,0.11003022061453925
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,2560,1536,0.019842666056421068
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,2560,3072,0.09544977876875137
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,2560,1024,0.014890667464998035
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,2560,2560,0.0809075567457411
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,2560,16384,0.5055679745144314
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,2560,2048,0.06567821900049846
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,2560,768,0.01203733351495531
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,2560,512,0.010009778042634329
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,2560,1536,0.05275555451711019
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,2560,256,0.007286222444640265
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,2560,1024,0.03843911157713996
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,2560,128,0.006263111200597551
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,2560,768,0.031509333186679415
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,2560,64,0.005585777676767773
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,2560,512,0.025118221839269
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,2560,32,0.005979555762476391
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,2560,256,0.02029333346419864
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,2560,128,0.018586667047606576
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,2560,64,0.018237334158685472
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,2560,32,0.018205333087179396
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,2560,7168,0.2288808822631836
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,2048,16384,0.1358320050769382
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,2048,12288,0.09206044673919678
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,2048,51200,0.3940604527791341
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,2048,10240,0.07948444286982219
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,2048,16384,0.47672711478339297
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,2048,8192,0.07340266969468859
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,2048,12288,0.36436798837449813
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,2048,7168,0.0603440006573995
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,2048,10240,0.3434133264753554
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,2048,6144,0.050717333952585854
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,2048,8192,0.2444995509253608
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,2560,6144,0.059454222520192467
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,2048,7168,0.21567822827233207
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,2048,4096,0.034048000971476235
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,2048,6144,0.18742667304144967
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,2048,3584,0.03092977735731337
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,2048,5120,0.14957777659098306
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,2048,3072,0.026932444837358262
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,2048,51200,1.4954107072618272
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,2048,4096,0.11740177207522923
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,2048,2560,0.02407377792729272
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,2048,2048,0.019765333996878732
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,2048,65536,0.4864817725287543
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,2048,3584,0.10389777686860825
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,2048,1536,0.015602666470739575
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,2048,1024,0.011607999602953592
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,2048,768,0.0096124443742964
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,2048,2560,0.0766542222764757
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,2048,512,0.0079644446571668
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,2048,65536,1.9107093811035156
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,2048,1536,0.04939022329118517
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,2048,1024,0.03491377830505371
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,2048,256,0.006246222390068903
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,2048,128,0.005671999934646819
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,2048,768,0.030027555094824895
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,2048,64,0.004971555537647671
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,2048,32,0.005246222019195557
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,2048,512,0.024004444479942322
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,2048,256,0.019278221660190158
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,2048,128,0.017235555582576327
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,2048,64,0.016902221573723685
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,2048,32,0.01680799987581041
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,1536,16384,0.10449600219726562
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,1536,65536,0.38471200731065536
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,1536,51200,0.3161697652604845
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,1536,12288,0.0778213342030843
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,1536,10240,0.06761866807937622
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,1536,16384,0.44694842232598203
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,1536,12288,0.3466506799062093
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,2048,3072,0.08932711018456353
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,1536,8192,0.052934222751193576
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,2048,2048,0.06282666656706068
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,1536,7168,0.044850667317708336
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,1536,6144,0.03943199912707011
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,1536,5120,0.034070223569869995
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,1536,8192,0.2309910986158583
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,1536,7168,0.20049244827694365
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,1536,6144,0.1703733338250054
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,1536,4096,0.026591110560629103
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,1536,3584,0.023355555203225877
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,1536,5120,0.13971377743615046
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,1536,3072,0.02055377761522929
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,1536,2560,0.01811644434928894
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,1536,51200,1.383319960700141
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,1536,4096,0.1088835530810886
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,1536,3584,0.0967644453048706
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,1536,2048,0.015410666664441427
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,1536,1536,0.012891555825869242
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,1536,3072,0.08357689115736221
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,1536,1024,0.010048000348938836
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,1536,2560,0.0714577767584059
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,1536,768,0.008857777549160851
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,1536,512,0.007307555940416124
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,1536,2048,0.05814488728841146
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,1536,1536,0.04510666595564949
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,1536,256,0.005888000130653381
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,1536,1024,0.03253511256641812
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,1536,128,0.005617777920431561
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,1536,768,0.027759111589855615
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,1536,64,0.005254222287072076
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,1536,512,0.022452443838119507
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,1536,32,0.005222222043408289
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,1536,256,0.01792622274822659
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,1536,128,0.016196444630622864
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,1536,64,0.015815999772813585
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,1536,32,0.015476443701320224
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,1536,10240,0.2890968852572971
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,1024,65536,0.3011244402991401
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,1024,51200,0.21812800566355386
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,1024,16384,0.07239644394980536
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,1024,12288,0.05379288726382785
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,1024,10240,0.04536088969972399
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,1024,12288,0.319268438551161
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,1024,16384,0.44357599152459043
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,1024,10240,0.2689173221588135
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,2048,5120,0.04344888859324985
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,1024,7168,0.03012266755104065
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,1024,6144,0.026769777139027912
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,1536,65536,1.7620969348483617
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,1024,5120,0.023899555206298828
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,1024,8192,0.22116711404588488
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,1024,7168,0.18946666187710234
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,1024,4096,0.019512888458040025
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,1024,6144,0.16160533163282606
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,1024,3584,0.01734133395883772
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,1024,3072,0.015791111522250705
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,1024,5120,0.13206311066945395
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,1024,4096,0.10328977637820774
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,1024,2560,0.013106666505336761
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,1024,51200,1.2919457753499348
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,1024,2048,0.011125333607196808
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,1024,3584,0.09058666891521877
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,1024,1536,0.009775111244784461
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,1024,3072,0.07971644401550293
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,1024,1024,0.00797155582242542
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,1024,768,0.007300444775157505
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,1024,2560,0.06660177972581652
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,1024,2048,0.05401510993639628
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,1024,65536,1.6539822684393988
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,1024,1536,0.041179554329978094
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,1024,512,0.006257777826653586
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,1024,1024,0.030825777186287776
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,1024,256,0.005256888767083486
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,1024,128,0.004518222063779831
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,1024,64,0.004181333300140169
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,1024,768,0.026036444637510512
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,1024,32,0.004234666625658671
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,1024,256,0.016537777251667447
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,1024,128,0.014882667197121514
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,1024,64,0.014455111490355598
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,1024,32,0.014474666780895658
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,1024,8192,0.037463112009896174
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,768,65536,0.21349688371022543
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,768,16384,0.055867552757263184
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,768,51200,0.17677156130472818
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,768,12288,0.04616444309552511
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,768,10240,0.03679022192955017
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,768,8192,0.028307557106018066
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,768,16384,0.40202755398220485
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,768,10240,0.2561013433668348
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,768,7168,0.026149332523345947
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,768,8192,0.21006222565968832
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,768,6144,0.022503111097547743
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,768,5120,0.020038222273190815
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,768,7168,0.18707911173502603
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,768,4096,0.016961778203646343
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,768,6144,0.15480355421702066
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,768,5120,0.1256106694539388
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,768,3584,0.015215999550289579
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,768,3072,0.013457777599493662
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,1024,512,0.02093155516518487
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,768,4096,0.09802933533986409
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,768,2560,0.011699555648697747
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,768,2048,0.00981777740849389
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,768,3584,0.08598133590486313
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,768,51200,1.2354764938354492
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,768,1536,0.008643555144468943
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,768,3072,0.07517244418462117
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,768,1024,0.006968888971540663
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,768,2560,0.06290133131874932
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,768,2048,0.05052177773581611
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,768,512,0.0058986664646201665
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,768,1024,0.029265777932273015
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,768,65536,1.5734390682644313
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,768,768,0.024696000748210486
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,768,128,0.004522666749027041
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,768,512,0.020291555258962844
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,768,64,0.003834666477309333
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,768,32,0.003847111016511917
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,768,128,0.014440889159838358
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,768,12288,0.3046782281663683
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,768,64,0.013802666631009845
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,768,32,0.013807999591032663
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,512,65536,0.18636800183190239
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,512,51200,0.14527289072672525
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,512,16384,0.04891644583808052
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,512,12288,0.03542133172353109
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,512,16384,0.3909875551859538
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,512,12288,0.2967528767055935
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,512,10240,0.02902666727701823
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,768,768,0.006235555642180973
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,512,8192,0.022987556126382615
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,768,1536,0.038796444733937584
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,768,256,0.004883555488453971
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,512,7168,0.02032088902261522
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,512,6144,0.01776622235774994
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,512,10240,0.2493413289388021
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,768,256,0.01612622208065457
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,512,8192,0.2005502250459459
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,512,5120,0.015676443775494892
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,512,4096,0.013167999684810638
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,512,3584,0.012039999994966718
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,512,7168,0.17621778117285836
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,512,6144,0.15033245086669922
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,512,51200,1.1950559616088867
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,512,3072,0.011061333119869232
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,512,5120,0.12211110856797959
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,512,4096,0.09520622094472249
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,512,2560,0.009705777797434065
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,512,2048,0.00868266655339135
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,512,3584,0.08285066816541883
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,512,1024,0.005943111247486538
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,512,65536,1.5265688366360133
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,512,2048,0.04824089010556539
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,512,768,0.005256888767083486
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,512,1536,0.038367112477620445
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,512,512,0.004595555365085602
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,512,1024,0.028127110666698877
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,512,256,0.004197333421972063
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,512,128,0.0036880001425743103
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,512,768,0.024047111471494038
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,512,512,0.01959733333852556
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,512,64,0.0033359999457995095
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,512,256,0.015140444040298462
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,512,32,0.003552888830502828
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,512,128,0.013789333403110504
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,512,64,0.013456000222100152
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,256,65536,0.11554755104912652
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,512,32,0.013003555436929068
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,256,51200,0.09032889207204182
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,256,16384,0.033391998873816595
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,256,12288,0.02347733411524031
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,256,16384,0.38016356362236875
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,256,12288,0.2880800035264757
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,512,1536,0.007316444483068254
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,256,10240,0.019927110936906602
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,256,8192,0.016010666886965435
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,512,3072,0.07219644387563069
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,256,7168,0.014930667148696052
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,256,6144,0.013455111119482251
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,256,8192,0.1950240002738105
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,256,5120,0.012136889000733694
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,256,7168,0.17035999563005236
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,256,6144,0.14551111062367758
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,256,4096,0.0099973330895106
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,256,3584,0.009335999687512716
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,256,51200,1.1588346693250868
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,256,5120,0.11838044060601129
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,256,3072,0.008630221916569604
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,256,4096,0.09188799725638495
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,256,2560,0.00778399987353219
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,256,3584,0.08067378070619372
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,256,2048,0.006575111299753189
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,256,65536,1.4794577492607965
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,256,1536,0.006238222122192383
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,256,3072,0.06959199905395508
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,256,2560,0.058543112542894155
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,256,2048,0.04672444529003567
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,256,768,0.004581333448489507
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,256,1536,0.03598755598068237
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,256,512,0.0038951109680864546
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,256,1024,0.02716355522473653
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,256,768,0.023315555519527856
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,256,512,0.019235556324323017
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,256,128,0.0034888887570963967
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,256,256,0.014768888552983602
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,256,64,0.0031591111587153543
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,256,32,0.0031928889867332247
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,256,128,0.01314933349688848
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,256,64,0.012726222475369772
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,128,65536,0.07264533307817247
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,256,32,0.012548444171746572
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,256,10240,0.24222310384114584
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,128,16384,0.025377778543366328
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,128,12288,0.01683022247420417
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,128,12288,0.2803457842932807
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,128,16384,0.37016889784071183
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,128,10240,0.014546665880415173
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,256,1024,0.0052151112920708126
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,128,8192,0.013395555317401886
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,128,7168,0.012224888636006249
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,256,256,0.0035502223504914176
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,128,10240,0.23561334609985352
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,128,6144,0.01108888867828581
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,128,8192,0.1901031070285373
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,128,5120,0.009665778113736046
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,128,7168,0.16604710949791804
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,128,4096,0.008186666501892937
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,128,3584,0.00795377790927887
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,512,2560,0.0606000026067098
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,128,51200,1.128413306342231
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,128,6144,0.14176177978515625
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,128,3072,0.007247111035717859
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,128,5120,0.11573867003122966
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,128,2560,0.006568888823191325
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,128,2048,0.005573333137565189
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,128,3584,0.07835555738872953
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,128,51200,0.06013511286841499
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,128,1536,0.005208000126812193
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,128,65536,1.4384151034884984
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,128,3072,0.0673440032535129
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,128,2560,0.057387557294633657
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,128,768,0.0041946665280395085
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,128,2048,0.045145776536729604
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,128,512,0.003552888830502828
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,128,1536,0.03499644332461887
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,128,256,0.0032177778581778207
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,128,1024,0.026703110999531213
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,128,128,0.0031724443866146933
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,128,768,0.02269688910908169
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,128,64,0.003157333367400699
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,128,512,0.018225777480337355
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,128,256,0.014152000347773233
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,128,128,0.0127688886390792
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,128,64,0.012078222301271228
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,64,65536,0.07448622253206041
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,128,32,0.012048000262843238
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,64,51200,0.05463822351561653
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,64,16384,0.018923555811246235
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,64,12288,0.013405332962671915
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,64,12288,0.27983376714918345
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,64,10240,0.012314666476514606
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,128,4096,0.08909244669808282
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,64,8192,0.010684444672531553
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,128,1024,0.004184000194072723
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,64,7168,0.010056888891590966
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,64,10240,0.23514223098754883
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,64,8192,0.18978667259216309
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,64,6144,0.010687111152542962
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,128,32,0.0031431110368834603
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,64,7168,0.16592710547977024
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,64,51200,1.1287662718031142
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,64,4096,0.007998222278224098
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,64,3584,0.007322666545708974
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,64,5120,0.11537155840131973
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,64,65536,1.4379075368245442
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,64,3072,0.006734222173690796
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,64,4096,0.08893689182069565
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,64,2560,0.005948444621430502
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,64,3584,0.07819377713733248
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,64,2048,0.005559111220969095
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,64,1536,0.004919111314747068
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,64,3072,0.06734133428997464
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,64,2048,0.044806222120920815
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,64,1024,0.004197333421972063
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,64,1536,0.034640888373057045
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,64,16384,0.36959287855360246
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,64,512,0.003506666670242945
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,64,1024,0.02671555512481266
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,64,256,0.003154666680428717
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,64,128,0.0028693332440323303
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,64,512,0.018546667363908555
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,64,64,0.00281866660548581
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,64,256,0.014157333307796054
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,64,32,0.002826666666401757
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,64,128,0.012087110843923358
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,64,64,0.012054222325483957
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,32,65536,0.07162933217154609
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,64,5120,0.00924711094962226
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,64,32,0.012056888805495368
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,32,51200,0.056291553709242076
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,32,16384,0.01662400033738878
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,32,12288,0.011734222372372946
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,64,6144,0.14184621969858804
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,32,10240,0.010378667049937779
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,32,16384,0.36960445510016543
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,32,12288,0.27993777063157826
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,64,2560,0.057202663686540395
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,32,8192,0.009763555394278632
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,32,10240,0.23516265551249185
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,32,7168,0.009342222577995723
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,32,6144,0.008674666285514832
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,64,768,0.003914666672547658
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,32,5120,0.011367999845080905
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,32,4096,0.009485333330101436
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,32,8192,0.18986222479078504
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,32,7168,0.16615377532111272
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,32,3584,0.00868000007337994
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,32,6144,0.14098221725887722
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,32,3072,0.007649777664078607
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,32,2560,0.0069226668112807805
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,32,4096,0.08865066369374593
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,32,2048,0.005190222213665645
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,32,3584,0.07841866546207003
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,32,3072,0.0676142242219713
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,32,1536,0.004509333521127701
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,32,2560,0.05699377589755588
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,32,1024,0.0041786668201287585
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,32,2048,0.04533066683345371
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,32,1536,0.03490133417977227
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,32,1024,0.02645422187116411
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,32,512,0.0033679999825027254
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,32,65536,1.4418044620090062
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,32,768,0.022669333550665114
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,32,256,0.0031635556370019913
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,32,128,0.00286666676402092
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,32,512,0.01831377711560991
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,32,64,0.0028417776856157514
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,32,128,0.012406222522258759
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,32,32,0.0028213332924577924
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,32,64,0.012057777908113269
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,32,32,0.011707555916574268
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,64,768,0.022350221872329712
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,32,5120,0.11483911673227946
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,32,51200,1.1268559561835396
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3073,32,768,0.0036844445599450003
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3073,32,256,0.014127999544143677
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,65536,12288,2.7885360717773438
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,65536,16384,3.7886488172743054
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,65536,16384,4.68510479397244
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,65536,16384,4.0284809536404085
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,65536,12288,3.250828425089518
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,65536,10240,2.6484347449408636
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,65536,10240,2.7202559577094187
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,65536,12288,3.093272103203667
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,65536,8192,1.9651652442084417
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,65536,8192,2.076171451144748
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,65536,7168,1.6777057647705078
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,65536,10240,2.5629732343885636
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,65536,7168,1.7969040340847438
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,65536,8192,2.0484773847791886
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,65536,6144,1.434053315056695
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,65536,7168,1.8127155303955078
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,65536,51200,11.939153035481771
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,65536,6144,1.5499359766642253
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,65536,5120,1.1366418202718098
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,65536,4096,0.9887546963161893
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,65536,5120,1.288596471150716
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,65536,4096,1.0277893278333876
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,65536,5120,1.2860755920410156
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,65536,3584,0.7390169037712945
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,65536,4096,0.9963582356770834
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,65536,6144,1.576896031697591
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,65536,3584,0.8846595552232531
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,65536,3072,0.7612373563978406
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,65536,2560,0.5110684500800239
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,65536,3584,0.8904026879204644
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,65536,3072,0.7867911126878527
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,65536,2560,0.6490302085876465
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,65536,2048,0.4777377976311578
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,65536,3072,0.7429671287536621
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,65536,1536,0.3242231210072835
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,65536,2048,0.5625502268473307
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,65536,2560,0.6428284645080566
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,65536,1024,0.22414843241373697
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,65536,2048,0.5242915683322483
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,65536,1536,0.523731549580892
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,65536,768,0.18143555853101942
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,65536,1024,0.32541688283284503
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,65536,1536,0.41559910774230957
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,65536,512,0.14019289281633165
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,65536,768,0.26281687948438853
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,65536,1024,0.3282266722785102
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,65536,256,0.10662400060229832
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,65536,512,0.2141368918948703
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,65536,512,0.2082222170299954
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,65536,128,0.09192799859576756
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,65536,64,0.07438488801320393
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,65536,256,0.1916346682442559
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,65536,128,0.1263315545188056
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,65536,32,0.07213866710662842
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,65536,128,0.17875999874538848
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,65536,64,0.1842177841398451
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,65536,32,0.1832488907708062
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,65536,768,0.2612382305992974
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,65536,256,0.1639066669676039
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,65536,51200,19.59051683213976
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,65536,51200,15.544504801432291
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,51200,16384,2.9898817274305554
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,51200,16384,3.693884531656901
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,51200,51200,9.327259487575954
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,51200,16384,3.392002741495768
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,51200,12288,2.5557342105441623
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,51200,65536,11.980381435818144
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,51200,12288,2.641753726535373
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,51200,10240,2.0195511711968317
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,51200,12288,2.5255955590142145
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,51200,10240,2.1386710272894964
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,51200,8192,1.4996293385823567
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,51200,51200,14.451987372504341
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,51200,10240,2.0532987382676864
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,51200,8192,1.7223261727227106
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,51200,7168,1.4814382129245336
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,51200,51200,11.124285380045572
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,51200,8192,1.6659235424465602
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,51200,7168,1.4582657284206813
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,51200,6144,1.2036302354600694
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,51200,7168,1.4251155853271484
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,51200,5120,1.0055226220024955
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,51200,5120,1.017012490166558
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,51200,4096,0.7501635551452637
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,51200,6144,1.1685262256198459
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,51200,4096,0.8522382312350802
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,51200,5120,1.0297644933064778
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,51200,6144,1.3322568469577365
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,51200,3584,0.682404465145535
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,51200,4096,0.7757760153876411
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,51200,65536,19.61410861545139
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,51200,3584,0.7074640062120227
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,51200,3072,0.532857788933648
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,51200,3072,0.7724355591668023
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,51200,2560,0.4730781979031033
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,51200,3584,0.6971173286437988
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,51200,3072,0.6025110880533854
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,51200,2560,0.5213813251919216
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,51200,2048,0.3590364456176758
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,51200,1536,0.2568275663587782
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,51200,2560,0.5369964705573188
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,51200,2048,0.5468799802992079
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,51200,1024,0.17658489280276826
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,51200,1536,0.3369751241472032
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,51200,2048,0.4248657756381565
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,51200,768,0.1435599989361233
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,51200,1024,0.2637866603003608
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,51200,1536,0.35289422671000165
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,51200,768,0.20164267222086588
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,51200,512,0.11059733231862386
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,51200,1024,0.2732337845696343
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,51200,768,0.22644088003370497
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,51200,256,0.07670755518807305
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,51200,512,0.17407555050320098
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,51200,512,0.18275022506713867
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,51200,256,0.1584293312496609
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,51200,256,0.13544355498419866
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,51200,128,0.14328266514672175
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,51200,128,0.10406488842434353
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,51200,32,0.06405778063668145
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,51200,64,0.14620978302425808
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,51200,128,0.06815999746322632
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,51200,64,0.06123110983106825
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,51200,32,0.1469351053237915
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,16384,16384,0.9049680497911242
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,16384,51200,3.0973307291666665
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,16384,16384,1.3828088972303603
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,16384,65536,4.145916408962674
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,16384,12288,0.6965466605292426
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,16384,16384,1.3473279741075304
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,16384,12288,1.0146915647718642
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,16384,10240,0.6203386518690321
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,16384,12288,1.010262171427409
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,16384,10240,0.838954660627577
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,16384,51200,5.317279815673828
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,16384,8192,0.49808533986409503
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,16384,65536,6.856929779052734
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,16384,51200,4.412594689263238
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,16384,8192,0.6585137579176161
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,16384,10240,0.8391964700486926
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,16384,7168,0.5018666585286459
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,16384,6144,0.3802311155531142
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,16384,65536,5.734595404730903
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,16384,7168,0.5938026640150282
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,16384,8192,0.6774080064561633
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,16384,5120,0.3207893371582031
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,16384,6144,0.4914684295654297
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,16384,7168,0.5986648665534126
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,16384,4096,0.250511990653144
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,16384,5120,0.4398231241438124
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,16384,3584,0.21450755331251356
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,16384,5120,0.4278346697489421
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,16384,6144,0.588705751630995
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,16384,4096,0.41085510783725315
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,16384,3584,0.3345022201538086
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,16384,4096,0.3428231080373128
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,16384,2560,0.14857067002190485
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,16384,3584,0.31059379047817653
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,16384,3072,0.2421635521782769
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,16384,3072,0.26832622951931423
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,16384,2048,0.11956622865464951
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,16384,2560,0.22304977311028373
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,16384,2560,0.22707109981113008
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,16384,1536,0.09354844358232285
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,16384,2048,0.1722186671362983
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,16384,2048,0.1896515554851956
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,16384,1536,0.14113244745466444
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,16384,1536,0.15605421861012778
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,16384,1024,0.10299022330178155
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,16384,512,0.03773599863052368
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,16384,768,0.09820977846781413
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,16384,512,0.06976711087756686
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,16384,512,0.08074133263693915
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,16384,256,0.05974666939841377
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,16384,3072,0.17665066983964708
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,16384,128,0.02409155501259698
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,16384,256,0.06256533331341214
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,16384,128,0.055937780274285205
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,16384,128,0.05097066693835788
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,16384,64,0.020852444900406733
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,16384,32,0.020981333321995203
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,16384,1024,0.06388355626000299
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,16384,64,0.05589333507749769
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,16384,1024,0.11699999703301324
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,16384,32,0.05654399924808078
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,16384,256,0.028185778194003638
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,16384,768,0.05456088980038961
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,16384,768,0.08465688758426243
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,12288,65536,2.746761745876736
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,12288,51200,2.38954226175944
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,12288,16384,0.7341146469116211
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,12288,12288,0.5988355742560493
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,12288,16384,1.1169502470228407
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,12288,16384,1.1561191346910265
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,12288,12288,0.8790035777621799
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,12288,10240,0.47003645367092556
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,12288,12288,0.8483857578701444
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,12288,8192,0.36099643177456325
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,12288,51200,4.324078030056424
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,12288,65536,5.715529971652561
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,12288,10240,0.6793546676635742
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,12288,7168,0.3218844466739231
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,12288,10240,0.7525759802924262
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,12288,7168,0.47016355726453996
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,12288,8192,0.5883333418104384
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,12288,51200,3.729566362169054
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,12288,6144,0.2829013400607639
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,12288,8192,0.6017297638787164
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,12288,5120,0.23850666152106392
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,12288,6144,0.401854223675198
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,12288,4096,0.17581421799129912
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,12288,7168,0.5482488738165961
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,12288,5120,0.38541422949896914
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,12288,6144,0.4508648978339301
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,12288,5120,0.3649386564890544
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,12288,3584,0.15991644064585367
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,12288,4096,0.2607564396328396
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,12288,3072,0.13751999537150064
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,12288,3584,0.23921333418952095
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,12288,3584,0.26088089413113064
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,12288,3072,0.20264621575673422
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,12288,4096,0.38080265786912704
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,12288,3072,0.22827111350165474
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,12288,2048,0.0891573362880283
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,12288,65536,4.734017690022786
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,12288,1536,0.0680533316400316
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,12288,2560,0.17241866058773467
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,12288,2560,0.19577866130405
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,12288,2048,0.14510667324066162
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,12288,1024,0.047694222794638745
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,12288,2048,0.16285422113206652
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,12288,768,0.03868888815244039
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,12288,1536,0.13407822450002035
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,12288,1536,0.11197511355082194
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,12288,1024,0.08499199814266628
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,12288,1024,0.10396799776289199
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,12288,512,0.030066665675905015
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,12288,768,0.06783911254670885
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,12288,256,0.02273066673013899
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,12288,768,0.08558666706085205
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,12288,128,0.020101333657900494
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,12288,512,0.07022666931152344
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,12288,256,0.04869066675504049
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,12288,256,0.05459733472930061
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,12288,64,0.017062221964200337
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,12288,128,0.04485866758558485
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,12288,128,0.044679999351501465
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,12288,32,0.01684711045689053
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,12288,32,0.04549955659442478
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,12288,64,0.04510755671395195
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,12288,2560,0.10926666524675156
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,12288,512,0.05753511190414429
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,10240,16384,0.6551600032382542
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,10240,51200,2.000159157647027
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,10240,65536,2.719601737128364
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,10240,16384,1.038958231608073
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,10240,12288,0.4938720067342122
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,10240,16384,1.0277901755438912
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,10240,12288,0.7126071188184949
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,10240,51200,3.779333326551649
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,10240,10240,0.4045822090572781
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,10240,12288,0.7934560245937772
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,10240,8192,0.3327973418765598
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,10240,10240,0.5957226753234863
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,10240,51200,3.308137681749132
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,10240,7168,0.28048621283637154
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,10240,65536,4.929764641655816
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,10240,10240,0.653796460893419
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,10240,8192,0.4783653153313531
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,10240,7168,0.4283528857760959
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,10240,6144,0.23549156718783906
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,10240,8192,0.552619563208686
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,10240,65536,4.204518212212457
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,10240,5120,0.19001689222123888
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,10240,6144,0.36078667640686035
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,10240,6144,0.39780354499816895
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,10240,4096,0.15274222691853842
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,10240,7168,0.48367468516031903
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,10240,5120,0.3442151016659207
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,10240,4096,0.2332915465037028
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,10240,3584,0.14271999730004206
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,10240,4096,0.26747910181681317
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,10240,3072,0.11461333433787028
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,10240,3584,0.22979556189643013
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,10240,3584,0.2396399974822998
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,10240,3072,0.17751733462015787
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,10240,3072,0.2137768930859036
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,10240,2560,0.15808710787031385
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,10240,2048,0.07589333587222628
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,10240,1536,0.06319466564390394
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,10240,2560,0.17782399389478895
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,10240,2048,0.12696088684929743
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,10240,2048,0.15336444642808703
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,10240,1024,0.044180442889531456
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,10240,1536,0.1210133367114597
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,10240,768,0.03169688913557265
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,10240,1024,0.09280533260769314
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,10240,768,0.06086577971776327
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,10240,768,0.07779288954204984
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,10240,512,0.023561777340041265
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,10240,5120,0.33430133925543887
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,10240,512,0.05006844467586941
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,10240,512,0.06449866957134671
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,10240,256,0.019307555423842538
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,10240,128,0.016605334149466622
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,10240,2560,0.09938844707277085
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,10240,256,0.04900799857245552
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,10240,256,0.04166133205095927
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,10240,64,0.01666755477587382
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,10240,128,0.04115733173158433
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,10240,32,0.017186666528383892
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,10240,64,0.036991112762027316
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,10240,32,0.03668355610635545
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,10240,1536,0.09960711002349854
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,10240,1024,0.07800622118843926
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,10240,128,0.03837955660290188
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,8192,16384,0.5071324242485894
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,8192,65536,2.075768788655599
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,8192,51200,1.778432846069336
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,8192,12288,0.4226248794131809
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,8192,16384,0.8710684246487088
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,8192,16384,0.9536168840196398
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,8192,51200,3.2031769222683377
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,8192,10240,0.32931023173862034
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,8192,12288,0.7102710935804578
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,8192,8192,0.2690568765004476
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,8192,65536,3.9747127956814237
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,8192,51200,2.948557323879666
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,8192,10240,0.5395609007941352
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,8192,7168,0.2358808782365587
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,8192,8192,0.43772000736660427
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,8192,10240,0.638687981499566
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,8192,12288,0.6877653333875867
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,8192,7168,0.3695475525326199
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,8192,8192,0.5023671256171333
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,8192,65536,3.8086925082736545
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,8192,5120,0.1613831122716268
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,8192,6144,0.31849511464436847
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,8192,7168,0.4616604381137424
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,8192,6144,0.3659706645541721
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,8192,4096,0.1297946638531155
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,8192,5120,0.2591182125939263
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,8192,3584,0.1152320040596856
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,8192,4096,0.2008462217119005
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,8192,5120,0.31263555420769584
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,8192,3072,0.10007377465565999
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,8192,3584,0.1785422166188558
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,8192,4096,0.2561448944939507
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,8192,2560,0.08033155732684664
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,8192,2048,0.06752000252405803
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,8192,3072,0.1553244458304511
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,8192,3072,0.19216267267862955
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,8192,2560,0.13587733109792074
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,8192,2560,0.16506132814619276
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,8192,1536,0.04860799842410617
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,8192,1024,0.0343777769141727
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,8192,2048,0.11662756072150336
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,8192,2048,0.13767200046115452
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,8192,768,0.02791022260983785
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,8192,1536,0.11152088642120361
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,8192,1536,0.08847644593980576
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,8192,6144,0.19108800093332926
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,8192,1024,0.0665244460105896
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,8192,512,0.0206631107462777
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,8192,1024,0.09061333205964829
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,8192,256,0.01626399987273746
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,8192,768,0.05304000112745497
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,8192,768,0.07146666447321574
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,8192,512,0.042909334103266396
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,8192,128,0.013384888569513956
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,8192,512,0.0595102243953281
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,8192,256,0.0347999996609158
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,8192,64,0.012138666378127204
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,8192,256,0.045660446087519325
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,8192,32,0.0129466669427024
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,8192,128,0.03196177879969279
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,8192,128,0.03753955496682061
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,8192,64,0.03172533379660712
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,8192,32,0.03141422073046366
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,8192,3584,0.21848621633317736
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,7168,16384,0.4816151195102268
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,7168,51200,1.5220781962076824
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,7168,16384,0.8146728939480252
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,7168,65536,2.007200029161241
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,7168,12288,0.3457333246866862
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,7168,16384,0.9086017608642578
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,7168,12288,0.6153617964850532
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,7168,51200,2.8618479834662547
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,7168,10240,0.27462932798597545
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,7168,10240,0.49482133653428817
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,7168,51200,2.8131368425157337
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,7168,12288,0.6810506714714898
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,7168,65536,3.7422637939453125
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,7168,8192,0.2289146582285563
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,7168,7168,0.19372355937957764
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,7168,10240,0.608932442135281
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,7168,8192,0.3873822159237332
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,7168,6144,0.16931466261545816
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,7168,7168,0.35549155871073407
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,7168,65536,3.5978062947591147
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,7168,8192,0.46341244379679364
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,7168,6144,0.2905706564585368
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,7168,5120,0.13264977931976318
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,7168,4096,0.10639822483062744
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,7168,6144,0.3547875616285536
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,7168,5120,0.24372267723083496
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,7168,5120,0.29154666264851886
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,7168,3584,0.0972248911857605
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,7168,3072,0.08091466956668429
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,7168,4096,0.23507822884453666
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,7168,2560,0.0707555545700921
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,7168,3584,0.16475733121236166
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,7168,3584,0.20811466375986734
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,7168,3072,0.1446053319507175
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,7168,3072,0.1834346718258328
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,7168,2048,0.057087997595469155
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,7168,1536,0.04339111182424757
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,7168,2560,0.12473866674635146
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,7168,2560,0.15631732675764295
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,7168,2048,0.13128711117638484
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,7168,1024,0.03144800000720554
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,7168,1536,0.08194755845599704
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,7168,768,0.023023110296991136
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,7168,1024,0.06145955456627739
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,7168,1024,0.08160889148712158
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,7168,7168,0.4147431055704753
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,7168,512,0.018219555417696636
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,7168,768,0.04891555507977804
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,7168,768,0.06849066416422527
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,7168,256,0.018364444375038147
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,7168,512,0.056913779841529004
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,7168,512,0.03939822316169739
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,7168,128,0.016192888220151264
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,7168,4096,0.18856888347201875
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,7168,256,0.04383288820584615
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,7168,256,0.03184266553984748
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,7168,64,0.015096889601813423
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,7168,32,0.015795555379655626
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,7168,128,0.03417155477735732
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,7168,64,0.029467556211683486
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,7168,32,0.028775112496482
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,7168,2048,0.10344266891479492
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,7168,1536,0.10672711001502143
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,6144,51200,1.0564515855577257
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,7168,128,0.029280887709723577
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,6144,65536,1.499583986070421
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,6144,16384,0.3717377715640598
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,6144,12288,0.28039733568827313
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,6144,16384,0.7222080230712891
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,6144,16384,0.8537431293063693
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,6144,12288,0.6019564204745823
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,6144,12288,0.6289066738552517
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,6144,10240,0.24544445673624674
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,6144,8192,0.18932533264160156
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,6144,51200,2.5997127956814237
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,6144,10240,0.4554737938774957
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,6144,65536,3.249160978529188
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,6144,7168,0.17070221900939941
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,6144,10240,0.5284470982021755
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,6144,8192,0.40678755442301434
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,6144,8192,0.4334088961283366
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,6144,6144,0.14306044578552246
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,6144,7168,0.3233484427134196
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,6144,51200,2.5725813971625433
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,6144,5120,0.11905599964989556
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,6144,7168,0.3787626690334744
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,6144,6144,0.33396087752448184
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,6144,4096,0.09261244535446167
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,6144,5120,0.22291734483506945
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,6144,3584,0.0792328914006551
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,6144,65536,3.2792000240749783
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,6144,6144,0.3261306550767687
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,6144,5120,0.2693191104465061
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,6144,3072,0.06658133533265856
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,6144,4096,0.17331733968522814
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,6144,4096,0.21941867139604357
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,6144,2560,0.055052445994483105
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,6144,3584,0.152803553475274
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,6144,3584,0.20225600401560465
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,6144,3072,0.13190933068593344
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,6144,3072,0.16901332802242705
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,6144,1536,0.03314222229851617
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,6144,2560,0.11541599697536892
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,6144,2560,0.1462471087773641
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,6144,1024,0.026147555973794725
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,6144,2048,0.0954657793045044
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,6144,2048,0.12775911225212946
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,6144,768,0.021152888735135395
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,6144,1536,0.09888533088896011
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,6144,1536,0.07601155837376912
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,6144,512,0.01536622146765391
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,6144,1024,0.05624622106552124
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,6144,1024,0.07607466644710965
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,6144,256,0.012105777859687805
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,6144,768,0.0636791123284234
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,6144,512,0.053447110785378345
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,6144,512,0.03596177697181702
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,6144,128,0.011122666299343109
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,6144,256,0.029169778029123943
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,6144,64,0.009706666900051964
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,6144,128,0.033187554942237005
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,6144,32,0.009825777676370408
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,6144,64,0.026760889424218073
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,6144,32,0.026390223039521113
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,6144,2048,0.04638755652639601
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,6144,768,0.044864889648225575
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,6144,256,0.0411119990878635
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,6144,128,0.027087999714745417
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,5120,65536,1.2612169053819444
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,5120,16384,0.347595559226142
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,5120,51200,1.066878212822808
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,5120,16384,0.6980346573723687
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,5120,12288,0.24982311990525988
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,5120,12288,0.4945537779066298
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,5120,65536,2.9276267157660594
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,5120,10240,0.20219822724660239
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,5120,12288,0.6160497665405273
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,5120,51200,2.310624016655816
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,51200,65536,14.284637451171875
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,5120,8192,0.16940177811516655
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,5120,10240,0.4156915611690945
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,5120,7168,0.14912354946136475
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,5120,8192,0.3353875478108724
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,5120,10240,0.5184079806009928
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,5120,6144,0.12427732679578994
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,5120,7168,0.29033422470092773
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,5120,51200,2.446398205227322
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,5120,65536,3.1150230831570096
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,5120,5120,0.10944800244437324
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,5120,7168,0.37767555978563094
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,5120,4096,0.09150399764378865
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,5120,6144,0.24899554252624512
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,5120,16384,0.8426417774624295
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,5120,8192,0.4777848985460069
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,5120,6144,0.309279998143514
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,5120,5120,0.20233244366115996
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,5120,5120,0.256893343395657
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,5120,4096,0.15938488642374674
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,5120,3072,0.06427733103434245
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,5120,4096,0.2071208953857422
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,5120,3584,0.139430218272739
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,5120,3584,0.18648621771070692
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,5120,2048,0.044681777556737266
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,5120,3072,0.16132267316182455
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,5120,2560,0.1041217777464125
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,5120,1536,0.035177777210871376
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,5120,2560,0.1379893355899387
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,5120,2048,0.11555288897620307
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,5120,2048,0.08931199709574382
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,5120,1024,0.02598222262329525
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,5120,768,0.019132445255915325
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,5120,1536,0.0943831139140659
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,5120,1536,0.06897955470614962
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,5120,512,0.016138666205936007
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,5120,1024,0.07287555270724826
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,5120,1024,0.05111022127999199
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,5120,256,0.012479110724396177
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,5120,768,0.0610133343272739
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,5120,512,0.04936000042491489
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,5120,512,0.03263911273744371
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,5120,128,0.010703110860453712
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,5120,256,0.03763822383350796
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,5120,64,0.009082666701740688
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,5120,128,0.024502222736676533
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,5120,128,0.03246488836076524
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,5120,32,0.009018667042255402
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,5120,3584,0.0730231139394972
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,5120,64,0.02450399928622776
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,5120,32,0.024195555183622573
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,5120,2560,0.05262310968505012
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,5120,3072,0.12170222070482041
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,5120,768,0.041499555110931396
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,4096,51200,0.744692431555854
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,4096,65536,1.06585693359375
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,5120,256,0.02642044425010681
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,4096,16384,0.27329333623250324
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,4096,12288,0.20153510570526123
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,4096,16384,0.631806214650472
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,4096,12288,0.4501155747307672
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,4096,10240,0.16794310675726998
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,4096,12288,0.5746160083346897
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,4096,16384,0.7783910963270398
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,4096,10240,0.377167993121677
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,4096,8192,0.1402613321940104
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,4096,51200,2.0110658009847007
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,4096,8192,0.3039626545376248
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,4096,7168,0.11486221684349908
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,4096,10240,0.4813946617974176
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,4096,6144,0.10264888736936782
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,4096,8192,0.38953065872192383
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,4096,65536,2.5841876135932074
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,4096,5120,0.08030488755967882
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,4096,7168,0.2647475666469998
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,4096,7168,0.3431706693437364
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,4096,6144,0.22556800312466094
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,4096,51200,2.3129865858289933
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,4096,4096,0.06675289074579875
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,4096,6144,0.29407111803690594
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,4096,3584,0.05483022332191467
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,4096,5120,0.18593155013190377
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,4096,5120,0.24360977278815377
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,4096,4096,0.14433066050211588
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,4096,3072,0.047687109973695546
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,4096,4096,0.19637510511610243
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,4096,3584,0.12780622641245523
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,4096,3584,0.1741013394461738
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,4096,3072,0.1103831132253011
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,4096,2048,0.03484444485770331
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,4096,3072,0.15284266736772326
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,4096,65536,2.949857711791992
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,4096,1536,0.02715377840730879
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,4096,2560,0.09505244758394028
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,4096,1024,0.019733332925372653
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,4096,2048,0.10998755693435669
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,4096,2048,0.07620888948440552
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,4096,768,0.016502221425374348
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,4096,1536,0.06212977568308512
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,4096,1536,0.08922044436136882
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,4096,512,0.012264889147546558
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,4096,1024,0.06921155585183038
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,4096,768,0.03772355450524224
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,4096,768,0.05778400103251139
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,4096,512,0.030079109801186457
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,4096,512,0.046925332811143666
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,4096,128,0.010131555298964182
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,4096,256,0.024344889654053584
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,4096,256,0.03564000129699707
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,4096,64,0.009671111073758867
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,4096,128,0.022277333670192297
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,4096,128,0.030159999926884968
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,4096,32,0.010000000397364298
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,4096,64,0.022014222211307947
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,4096,32,0.02166666587193807
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,4096,2560,0.04007110993067423
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,4096,2560,0.13044799698723689
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,4096,1024,0.046372443437576294
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,4096,256,0.010758221977286868
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,3584,65536,0.937196413675944
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,3584,16384,0.2268079916636149
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,3584,12288,0.17406311300065783
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,3584,16384,0.5849235322740343
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,3584,12288,0.424469338523017
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,3584,16384,0.7188462151421441
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,3584,10240,0.15090221828884548
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,3584,51200,0.7163910865783691
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,3584,12288,0.5481955740186903
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,3584,8192,0.11549244986640082
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,3584,10240,0.3576070997450087
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,3584,51200,1.9052594502766926
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,3584,7168,0.10220888588163589
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,3584,65536,2.438683615790473
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,3584,10240,0.45819467968410915
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,3584,8192,0.286826663547092
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,3584,6144,0.08919199970033433
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,3584,7168,0.2516373263465034
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,3584,5120,0.0803804463810391
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,3584,8192,0.37099822362263996
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,3584,7168,0.32615023189120823
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,3584,4096,0.0621066689491272
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,3584,6144,0.2140337758594089
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,3584,6144,0.27996622191535103
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,3584,5120,0.17617066701253256
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,3584,3584,0.055769774648878306
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,3584,5120,0.23208355903625488
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,3584,3072,0.04701333244641622
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,3584,4096,0.1381022267871433
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,3584,4096,0.18672177526685926
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,3584,51200,2.1993910471598306
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,3584,2560,0.04056533177693685
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,3584,3584,0.12143554952409531
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,3584,3584,0.16599022017584905
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,3584,2048,0.03356444504525926
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,3584,3072,0.10597866773605347
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,3584,3072,0.1454604466756185
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,3584,1536,0.028283556302388508
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,3584,2560,0.0904088881280687
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,3584,1024,0.020261334048377145
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,3584,2048,0.0735128919283549
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,3584,2048,0.10540444321102566
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,3584,1536,0.059157331784566246
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,3584,1536,0.08541422420077854
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,3584,768,0.017122666041056316
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,3584,1024,0.04315377937422859
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,3584,512,0.014761777387724983
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,3584,768,0.03567022085189819
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,3584,768,0.05414933297369215
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,3584,256,0.00923466682434082
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,3584,512,0.04452888833151924
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,3584,128,0.008079999850855933
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,3584,256,0.02288977801799774
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,3584,256,0.03571022219128079
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,3584,64,0.007158222297827403
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,3584,128,0.020970667401949566
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,3584,128,0.029574222034878198
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,3584,32,0.009302222066455418
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,3584,64,0.020575111111005146
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,3584,32,0.020633776982625324
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,3584,65536,2.805478201972114
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,3584,2560,0.12462577554914687
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,3072,65536,0.6900231043497721
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,3584,1024,0.06610400146908231
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,3584,512,0.028265777561399672
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,3072,16384,0.17614489131503633
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,3072,16384,0.534054226345486
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,3072,12288,0.13293245103624132
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,3072,16384,0.6822373072306315
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,3072,10240,0.12072977754804824
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,3072,12288,0.4035164515177409
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,3072,51200,0.4856302473280165
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,3072,12288,0.5170728895399306
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,3072,51200,1.7602275212605794
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,3072,10240,0.3393093215094672
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,3072,8192,0.10434844758775498
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,3072,65536,2.267911911010742
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,3072,7168,0.0828346676296658
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,3072,10240,0.43560089005364316
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,3072,6144,0.0700133310423957
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,3072,8192,0.2720195452372233
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,3072,7168,0.23813332451714408
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,3072,5120,0.05473777651786804
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,3072,8192,0.3531200091044108
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,3072,6144,0.20279022057851157
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,3072,4096,0.048933333820766874
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,3072,6144,0.26581332418653697
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,3072,3584,0.039423998859193586
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,3072,5120,0.16646844810909694
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,3072,5120,0.22057778305477568
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,3072,4096,0.13099822733137342
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,3072,4096,0.17758844958411324
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,3072,51200,2.0842274559868708
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,3072,3584,0.11504977279239231
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,3072,2560,0.03018488817744785
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,3072,3072,0.10027911265691121
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,3072,3072,0.1384213368097941
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,3072,2048,0.02458311120669047
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,3072,2560,0.11889244450463189
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,3072,1536,0.02014844450685713
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,3072,2048,0.06950133376651339
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,3072,2048,0.10014488961961533
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,3072,1024,0.014771555860837301
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,3072,1536,0.05346133311589559
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,3072,1536,0.08136889007356432
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,3072,768,0.012472000386979846
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,3072,1024,0.04112889038191901
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,3072,1024,0.06332888868119982
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,3072,512,0.009654222263230218
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,3072,768,0.05119555526309543
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,3072,768,0.03296355406443278
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,3072,256,0.007638221813572778
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,3072,512,0.02680533296532101
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,3072,512,0.04277688927120633
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,3072,128,0.0069297779765393995
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,3072,3072,0.03453244434462653
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,3072,65536,2.663956536187066
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,3072,64,0.006350222147173352
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,3072,3584,0.15779022375742593
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,3072,128,0.02918133470747206
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,3072,32,0.0064693333374129395
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,3072,64,0.01956977778010898
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,3072,32,0.019208888212839764
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,3072,2560,0.08531555864546035
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,2560,65536,0.5715866618686253
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,2560,51200,0.48620886272854275
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,3072,7168,0.31188445621066624
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,2560,16384,0.17058222823672822
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,3072,256,0.02164266672399309
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,3072,256,0.03502755694919162
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,3072,128,0.019702222612169053
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,2560,12288,0.12694844934675428
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,2560,16384,0.5029164420233833
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,2560,10240,0.11022310786777073
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,2560,12288,0.3797760009765625
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,2560,16384,0.6792933146158854
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,2560,12288,0.5148248672485352
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,2560,8192,0.0903279980023702
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,2560,10240,0.3191644350687663
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,2560,7168,0.07629866732491387
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,2560,65536,2.0514195760091147
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,2560,10240,0.4333208931816949
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,2560,8192,0.2570506731669108
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,2560,51200,1.6009848912556965
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,2560,6144,0.06561599837409125
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,2560,8192,0.35084443622165257
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,2560,5120,0.0546284450425042
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,2560,7168,0.22569245762295195
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,2560,6144,0.19243110550774467
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,2560,7168,0.30833689371744794
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,2560,4096,0.04364711046218872
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,2560,6144,0.2643848790062798
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,2560,5120,0.1577662229537964
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,2560,3584,0.03941422369745042
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,2560,5120,0.21921688980526396
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,2560,4096,0.12450755967034234
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,2560,3072,0.03398666779200236
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,2560,3584,0.1093368861410353
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,2560,3584,0.1569582223892212
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,2560,51200,2.069730758666992
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,2560,65536,2.6439270443386502
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,2560,2048,0.025059555967648823
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,2560,3072,0.1374737819035848
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,2560,3072,0.09421777725219727
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,2560,1536,0.01993688941001892
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,2560,2560,0.07972444428337945
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,2560,2560,0.11732621987660725
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,2560,1024,0.015089778436554803
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,2560,2048,0.0990613301595052
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,2560,2048,0.06470577584372626
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,2560,768,0.011581333147154914
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,2560,1536,0.08096000221040514
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,2560,1024,0.037949333588282265
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,2560,1024,0.06230311261283027
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,2560,512,0.009649777577983009
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,2560,768,0.030936890178256567
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,2560,768,0.0510808891720242
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,2560,256,0.007592000067234039
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,2560,512,0.025369778275489807
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,2560,512,0.04215822286076016
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,2560,128,0.006664000037643645
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,2560,256,0.02029333346419864
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,2560,256,0.033096889654795326
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,2560,64,0.00656444455186526
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,2560,32,0.006583999842405319
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,2560,128,0.02814133299721612
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,2560,128,0.018577777677112155
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,2560,64,0.017916444275114272
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,2560,32,0.018204443984561496
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,2560,4096,0.17671733432345918
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,2560,2560,0.028664890262815688
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,2048,65536,0.49437422222561306
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,2048,51200,0.3997928831312392
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,2048,16384,0.1363324456744724
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,2560,1536,0.052073776721954346
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,2048,12288,0.09976889027489556
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,2048,16384,0.4834453264872233
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,2048,12288,0.3595137861039903
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,2048,10240,0.08974844217300415
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,2048,16384,0.6866088973151313
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,2048,8192,0.07178488704893324
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,2048,51200,1.4954008526272242
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,2048,12288,0.488667541080051
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,2048,10240,0.3023715549045139
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,2048,7168,0.06063999732335409
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,2048,10240,0.4097786744435628
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,2048,8192,0.24478933546278211
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,2048,65536,1.9106818305121527
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,2048,6144,0.053892443577448525
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,2048,5120,0.04309689005215963
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,2048,7168,0.2136791149775187
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,2048,8192,0.33275556564331055
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,2048,7168,0.29314398765563965
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,2048,4096,0.03545866741074456
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,2048,6144,0.1824328899383545
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,2048,6144,0.25062399440341526
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,2048,3584,0.03035022152794732
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,2048,5120,0.1492497788535224
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,2048,5120,0.20762577321794298
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,2048,3072,0.027943111128277246
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,2048,51200,1.9568523830837672
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,2048,4096,0.1169466707441542
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,2048,4096,0.16682044665018717
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,2048,2560,0.023451555106374953
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,2048,3584,0.1485608948601617
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,2048,3584,0.10244533088472153
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,2048,2048,0.019159111711714003
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,2048,3072,0.08950577841864692
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,2048,3072,0.13059643904368082
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,2048,2560,0.11226044760810004
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,2048,2048,0.093922668033176
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,2048,65536,2.499237272474501
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,2048,1536,0.0754622220993042
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,2048,1536,0.048357334401872426
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,2048,768,0.009445333646403419
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,2048,1024,0.03496088915401035
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,2048,512,0.00794222205877304
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,2048,768,0.029472000069088403
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,2048,768,0.048743999666637845
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,2048,256,0.0068959999415609576
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,2048,512,0.023933332827356126
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,2048,256,0.0188773340649075
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,2048,128,0.005886222339338726
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,2048,256,0.03223911258909438
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,2048,128,0.017235555582576327
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,2048,128,0.02716711163520813
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,2048,64,0.005578666511509154
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,2048,64,0.016872000363137987
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,2048,32,0.0058266665372583605
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,2048,1536,0.014151111245155334
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,2048,2560,0.07646577888064914
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,2048,1024,0.010732444624106089
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,2048,32,0.016857778032620747
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,2048,1024,0.05880177683300442
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,1536,65536,0.4078497886657715
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,1536,51200,0.3023955557081434
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,2048,512,0.040135112073686384
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,1536,16384,0.10354844729105632
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,1536,16384,0.445126215616862
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,1536,12288,0.07287022140291002
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,1536,16384,0.6191288630167643
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,2048,2048,0.06310755676693387
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,1536,10240,0.060883555147382945
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,1536,12288,0.33750579092237687
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,1536,51200,1.3778097364637587
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,1536,8192,0.05207911133766174
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,1536,10240,0.28329867786831325
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,1536,65536,1.7556435267130535
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,1536,7168,0.04012088974316915
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,1536,10240,0.3867448965708415
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,1536,8192,0.22845066918267143
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,1536,8192,0.31358133422003853
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,1536,6144,0.03498844305674235
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,1536,7168,0.19999910725487602
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,1536,5120,0.029733333322736952
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,1536,51200,1.8424097696940105
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,1536,7168,0.27682044770982533
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,1536,6144,0.17073955800798205
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,1536,6144,0.23722399605645073
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,1536,65536,2.352633794148763
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,1536,5120,0.13918311066097683
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,1536,3584,0.02312177750799391
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,1536,5120,0.19491822189754912
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,1536,4096,0.10901244481404622
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,1536,3072,0.02019466625319587
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,1536,4096,0.15700444910261366
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,1536,3584,0.09564977884292603
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,1536,2560,0.01717866626050737
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,1536,3584,0.1395662228266398
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,1536,2048,0.014492443866199918
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,1536,3072,0.08346399996015762
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,1536,3072,0.12276000446743435
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,1536,12288,0.46155468622843426
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,1536,2560,0.07105866405698988
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,1536,2048,0.0892382197909885
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,1536,1024,0.009326222042242685
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,1536,2048,0.05812266800138685
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,1536,768,0.00832622249921163
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,1536,1536,0.04482577906714546
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,1536,1024,0.05589510997136434
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,1536,1024,0.032666666640175715
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,1536,512,0.006923555499977536
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,1536,768,0.027072888281610277
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,1536,768,0.04604088928964403
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,1536,256,0.005344888816277186
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,1536,512,0.03844533363978068
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,1536,512,0.022355554832352534
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,1536,128,0.004885333279768626
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,1536,256,0.03052177694108751
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,1536,256,0.017867555220921833
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,1536,64,0.0045422220395671
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,1536,32,0.00452888881166776
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,1536,128,0.016169778174824186
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,1536,4096,0.02477333280775282
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,1536,64,0.015791111522250705
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,1536,32,0.015480889214409722
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,1024,65536,0.28764179017808705
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,1024,51200,0.21360088719262016
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,1536,2560,0.10525866349538167
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,1536,1536,0.012150222228633033
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,1024,16384,0.07480622000164457
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,1536,1536,0.07243021991517809
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,1024,12288,0.05424355467160543
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,1024,16384,0.42082754770914715
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,1536,128,0.026025777061780293
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,1024,12288,0.3191653357611762
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,1024,10240,0.04548355605867174
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,1024,16384,0.6023884349399143
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,1024,8192,0.03712977634535895
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,1024,12288,0.4569466908772786
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,1024,10240,0.26804089546203613
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,1024,51200,1.2983378304375541
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,1024,7168,0.03183111217286851
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,1024,8192,0.21575378047095406
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,1024,65536,1.650686264038086
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,1024,10240,0.38483556111653644
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,1024,6144,0.026477333572175767
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,1024,5120,0.022658665974934895
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,1024,7168,0.18925955560472277
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,1024,8192,0.3121733400556776
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,1024,6144,0.16122489505343968
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,1024,7168,0.27482488420274526
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,1024,4096,0.019700444406933255
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,1024,3584,0.017352888981501263
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,1024,6144,0.235060453414917
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,1024,5120,0.19410310851203072
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,1024,51200,1.833115471733941
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,1024,4096,0.1026960015296936
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,1024,4096,0.15672177738613552
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,1024,3072,0.015656888484954834
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,1024,3584,0.0904195573594835
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,1024,3584,0.13948799504174128
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,1024,2560,0.013374221821626028
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,1024,2048,0.01144266708029641
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,1024,65536,2.342280069986979
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,1024,3072,0.12178756131066217
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,1024,2560,0.06696533494525485
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,1024,1536,0.009716444545321995
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,1024,2560,0.10475289159350926
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,1024,2048,0.05407289001676771
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,1024,1024,0.007647111184067196
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,1024,2048,0.08727466397815281
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,1024,1536,0.07198755608664618
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,1024,1536,0.04098133246103922
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,1024,768,0.006993778049945831
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,1024,1024,0.05393955442640516
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,1024,1024,0.03055822186999851
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,1024,768,0.04553866717550489
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,1024,768,0.025621333056026038
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,1024,256,0.0046693334976832075
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,1024,512,0.03835377759403653
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,1024,512,0.020984888076782227
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,1024,128,0.004568888909286923
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,1024,256,0.029845333761639063
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,1024,256,0.016529776983790927
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,1024,64,0.0041928887367248535
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,1024,128,0.014783999986118741
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,1024,128,0.02572800053490533
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,1024,32,0.004190222256713443
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,1024,5120,0.13140889008839926
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,1024,64,0.014480888843536377
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,1024,32,0.014212444424629211
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,768,65536,0.2253368960486518
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,768,51200,0.1685484382841322
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,768,16384,0.05446844299634298
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,1024,3072,0.07893866962856717
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,1024,512,0.00591111100382275
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,768,16384,0.40976889928181964
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,768,12288,0.041815999481413096
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,768,16384,0.5662950939602321
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,768,10240,0.03544888893763224
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,768,12288,0.30877333217196995
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,768,12288,0.43054665459526914
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,768,51200,1.2322417365180123
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,768,8192,0.027042667071024578
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,768,10240,0.25604621569315594
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,768,65536,1.5711759991115992
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,768,7168,0.022456000248591106
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,768,10240,0.36248265372382266
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,768,8192,0.20629689428541395
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,768,6144,0.01995111174053616
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,768,8192,0.29401156637403697
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,768,7168,0.1802977720896403
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,768,5120,0.01703644461101956
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,768,7168,0.25887465476989746
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,768,4096,0.014888889259762235
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,768,51200,1.719856897989909
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,768,6144,0.1542266607284546
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,768,6144,0.22199111514621309
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,768,3584,0.012661333713266583
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,768,5120,0.12588000297546387
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,768,3072,0.011361777782440186
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,768,5120,0.18281422721015084
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,768,2560,0.010288889209429422
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,768,4096,0.09787022405200535
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,768,4096,0.14781510829925537
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,768,3584,0.08546933200624253
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,768,65536,2.194631152682834
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,768,3584,0.1315279934141371
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,768,2048,0.009001777403884465
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,768,3072,0.11526044209798177
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,768,3072,0.07481333282258776
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,768,1536,0.007907555335097844
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,768,1024,0.006232888748248418
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,768,2560,0.0637306637234158
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,768,2560,0.09913244512346055
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,768,768,0.005581333405441708
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,768,2048,0.050322665108574756
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,768,2048,0.08301511075761583
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,768,1536,0.0662977761692471
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,768,512,0.004871110949251386
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,768,1024,0.029507554239696924
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,768,1024,0.051128000020980835
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,768,256,0.004232888834344016
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,768,128,0.0038168889780839286
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,768,768,0.02462933295302921
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,768,768,0.04351910948753357
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,768,64,0.003519111209445529
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,768,512,0.03678755627738105
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,768,256,0.028811554114023846
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,768,32,0.003683555457327101
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,768,256,0.015692444311247934
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,768,128,0.024333332975705464
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,768,128,0.014164444473054675
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,768,64,0.013760888742076026
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,768,32,0.013734222286277346
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,512,65536,0.1614497767554389
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,512,51200,0.12728088431888157
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,512,16384,0.042450666427612305
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,512,16384,0.3905866675906711
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,768,1536,0.03901955485343933
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,512,12288,0.03259733319282532
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,768,512,0.020241777102152508
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,512,51200,1.1950968636406791
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,512,16384,0.5646977954440647
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,512,10240,0.025616889198621113
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,512,12288,0.2961431079440647
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,512,8192,0.020040889581044514
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,512,65536,1.5242862701416016
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,512,12288,0.42854756779140896
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,512,10240,0.2490168942345513
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,512,7168,0.017879999346203275
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,512,8192,0.2007573313183255
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,512,10240,0.36095555623372394
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,512,6144,0.016270221935378183
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,512,8192,0.2926417721642388
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,512,51200,1.7136302524142797
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,512,5120,0.013966222604115805
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,512,7168,0.1757964425616794
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,512,7168,0.25780177116394043
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,512,6144,0.14990933736165366
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,512,6144,0.22069333659278023
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,512,65536,2.1886026594373917
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,512,3584,0.010944888823562197
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,512,5120,0.18187644746568468
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,512,3072,0.01000355515215132
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,512,4096,0.09480533334943984
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,512,4096,0.14714488718244764
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,512,2560,0.008976889153321585
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,512,3584,0.13112889395819768
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,512,3584,0.08313777711656359
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,512,3072,0.0722222195731269
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,512,2048,0.007606222397751278
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,512,2560,0.06121955315272013
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,512,2560,0.09828088680903117
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,512,1536,0.00665155549844106
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,512,2048,0.08371377653545803
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,512,2048,0.048504001564449735
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,512,1024,0.005570666657553778
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,512,1536,0.0669155584441291
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,512,1536,0.03787911269399855
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,512,768,0.004915555732117759
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,512,1024,0.028099556763966877
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,512,512,0.004464888738261329
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,512,1024,0.05048622356520759
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,512,256,0.00425155543618732
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,512,768,0.042929778496424355
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,512,512,0.03610666592915853
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,512,512,0.019508444600635104
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,512,128,0.0038888889054457345
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,512,256,0.015461333923869662
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,512,256,0.028204444381925795
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,512,4096,0.012082666986518435
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,512,64,0.0038648889296584656
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,512,32,0.0038897775941424896
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,512,128,0.013453333742088742
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,512,5120,0.12202133072747125
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,512,64,0.013421333498424955
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,512,32,0.013060444758998023
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,256,65536,0.09934755828645493
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,256,51200,0.08475289079878066
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,256,16384,0.031075557072957356
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,512,3072,0.11475111378563775
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,256,16384,0.3791217803955078
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,256,12288,0.02772088845570882
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,512,768,0.02369511127471924
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,256,16384,0.5596239831712511
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,256,10240,0.022675555613305833
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,256,12288,0.28720000055101186
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,512,128,0.02366399930583106
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,256,51200,1.1594844394259982
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,256,8192,0.019350222415394254
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,256,10240,0.2417315642038981
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,256,12288,0.42558754814995664
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,256,7168,0.016357334123717416
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,256,8192,0.19496444861094156
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,256,10240,0.35805333985222715
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,256,6144,0.014762666490342883
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,256,8192,0.29041955206129283
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,256,5120,0.013038222160604266
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,256,7168,0.17121333546108672
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,256,7168,0.2557697825961643
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,256,4096,0.009018667042255402
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,256,6144,0.145797332127889
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,256,6144,0.21887466642591688
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,256,5120,0.11849599414401585
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,256,5120,0.1804435518052843
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,256,4096,0.09151555432213677
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,256,65536,2.1694728003607855
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,256,3072,0.007617777420414819
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,256,3584,0.08103111055162218
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,256,3584,0.1296079953511556
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,256,2560,0.0069217777086628815
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,256,3072,0.11342310905456543
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,256,3072,0.0701448917388916
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,256,2048,0.00600000015563435
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,256,2560,0.05917866362465752
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,256,2560,0.0968959993786282
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,256,1536,0.005576000031497743
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,256,2048,0.04657599992222256
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,256,2048,0.08172621991899279
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,256,65536,1.4780399534437392
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,256,1024,0.0045422220395671
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,256,1536,0.036510222487979464
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,256,768,0.004193777839342753
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,256,1536,0.0647031135029263
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,256,1024,0.050343109501732715
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,256,512,0.0038453332251972626
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,256,51200,1.7001493242051866
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,256,512,0.018937778141763475
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,256,256,0.0035093331502543557
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,256,512,0.03565688927968343
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,256,3584,0.00832444429397583
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,256,128,0.0031715554909573663
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,256,256,0.027785778045654297
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,256,256,0.014782221780882942
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,256,4096,0.14521422651078966
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,256,64,0.0032053333189752367
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,256,128,0.013080889152155982
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,256,128,0.02334311107794444
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,256,64,0.012794666820102267
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,128,65536,0.07156178024080065
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,256,32,0.012441777520709567
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,128,51200,0.05830844243367513
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,256,1024,0.027406222290462915
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,256,768,0.022981334063741896
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,128,16384,0.02149244480662876
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,256,32,0.0035297779573334586
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,128,16384,0.36989866362677676
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,128,12288,0.014184888866212634
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,128,51200,1.129058625962999
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,128,65536,1.4402435090806749
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,128,10240,0.012656889028019376
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,128,12288,0.28032978375752765
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,128,16384,0.5579244295756022
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,128,8192,0.012876444392734103
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,128,12288,0.4246959951188829
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,128,10240,0.2355395687950982
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,256,768,0.042103111743927
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,128,7168,0.011733333269755045
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,128,10240,0.35718133714463973
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,128,8192,0.1897804472181532
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,128,6144,0.01198933356338077
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,128,65536,2.1654915279812283
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,128,5120,0.010684444672531553
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,128,7168,0.16661066479153103
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,128,8192,0.2897973325517443
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,128,51200,1.6959359910753038
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,128,7168,0.25586043463812935
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,128,3584,0.008281778130266402
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,128,6144,0.2187662257088555
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,128,5120,0.11530933115217422
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,128,5120,0.18047022819519043
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,128,4096,0.08888800276650323
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,128,4096,0.14506133397420248
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,128,3072,0.007522666619883643
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,128,2560,0.006621333460013072
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,128,3584,0.07812622520658705
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,128,2048,0.005598222215970357
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,128,3584,0.12895822525024414
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,128,3072,0.06755110952589247
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,128,2560,0.05678666962517632
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,128,1536,0.005055111315515307
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,128,2560,0.09677955839369033
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,128,1024,0.004239999999602635
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,128,2048,0.045422222879197865
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,128,1536,0.034635557068718806
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,128,1536,0.0653102199236552
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,128,768,0.0042151109211974675
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,128,1024,0.026660444007979497
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,128,1024,0.05003289050526089
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,128,512,0.003855111284388436
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,128,768,0.02234755622016059
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,128,768,0.04207377632459005
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,128,256,0.0035111109415690103
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,128,512,0.03495111068089803
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,128,128,0.0031893334041039148
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,128,256,0.014121777481502958
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,128,256,0.027464000715149775
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,128,64,0.0030008889734745026
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,128,4096,0.009007111191749573
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,128,128,0.01218844453493754
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,128,128,0.023026666707462732
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,128,32,0.0032239999208185407
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,128,6144,0.14174311690860325
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,128,64,0.012053333222866058
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,64,65536,0.06907911433113946
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,64,51200,0.05522133244408501
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,64,16384,0.018358222312397428
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,128,32,0.0118222220076455
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,64,12288,0.0165928883685006
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,64,10240,0.014522666732470194
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,128,3072,0.11272088686625163
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,64,8192,0.012753778033786349
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,64,12288,0.2797093391418457
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,3072,128,2048,0.0817048880789015
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,64,10240,0.23500177595350477
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,64,7168,0.012075555821259817
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,64,6144,0.01074488874938753
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,64,8192,0.1897066699133979
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,64,5120,0.008957333034939235
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,64,7168,0.1661048862669203
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,64,6144,0.14152355988820395
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,128,512,0.018537777993414137
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,64,3584,0.007304888632562425
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,64,5120,0.11499999629126655
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,64,3072,0.006566222343179915
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,64,4096,0.08852622244093154
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,64,3584,0.07770844300587972
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,64,2560,0.005965333431959152
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,64,51200,1.1273493236965604
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,64,2048,0.005314666777849197
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,64,1536,0.004853333450025982
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,64,3072,0.06828977664311726
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,64,1024,0.004187555362780889
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,64,2560,0.05653599898020426
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,64,2048,0.04481155673662821
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,64,65536,1.4424044291178386
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,64,768,0.0038844446341196695
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,64,1536,0.034508443540996976
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,64,512,0.0035742223262786865
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,64,256,0.0031662223239739737
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,64,128,0.0028213332924577924
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,64,1024,0.026512000295850966
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,64,768,0.02234399980968899
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,64,64,0.0028577778074476454
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,64,512,0.018530666828155518
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,64,32,0.0031635556370019913
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,64,256,0.014087999860445658
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,64,128,0.012227555943859948
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,32,65536,0.06778666708204481
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,64,16384,0.3692355685763889
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,64,64,0.012074666718641916
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,64,32,0.012042666474978128
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,32,51200,0.051408890220854014
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,32,16384,0.01641688909795549
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,32,12288,0.011045333411958484
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,32,10240,0.00998044427898195
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,32,8192,0.00867377801073922
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,64,4096,0.0076453329788313965
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,32,7168,0.008573333422342936
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,32,12288,0.27975379096137154
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,32,10240,0.23528711001078287
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,32,16384,0.36952800220913357
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,32,6144,0.00794488853878445
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,32,8192,0.18951022624969482
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,32,5120,0.007657777931955125
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,32,4096,0.007305777735180325
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,32,3584,0.00833422193924586
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,32,7168,0.16638310750325522
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,32,6144,0.14086933930714926
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,32,3072,0.0076657773719893555
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,32,5120,0.11491644382476807
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,32,4096,0.08897155523300171
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,32,2560,0.006879999819729064
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,32,3584,0.0776711106300354
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,32,2048,0.005231110999981563
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,32,1536,0.004575110971927643
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,32,1024,0.0038888889054457345
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,32,3072,0.06736266613006592
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,32,2560,0.056651552518208824
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,32,2048,0.0452133317788442
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,32,768,0.0038693332009845306
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,32,1536,0.03453600075509813
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,32,256,0.0031644445326593188
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,32,1024,0.026428444517983332
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,32,51200,1.1280924479166667
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,32,768,0.022282666630215112
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,32,512,0.018564444449212816
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,32,64,0.0025235555238193935
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,32,32,0.002867555452717675
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,32,256,0.014039999908871122
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,32,128,0.012103999654452005
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,32,65536,1.4417431089613173
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,32,64,0.012087110843923358
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3072,32,32,0.011706666813956367
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,32,512,0.0031662223239739737
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3072,32,128,0.0028044444819291434
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,65536,12288,2.673364427354601
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,65536,10240,2.183344946967231
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,65536,12288,3.095976935492622
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,65536,16384,3.5653610229492188
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,65536,10240,2.5206737518310547
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,65536,16384,4.326263003879123
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,65536,8192,1.7662204106648762
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,65536,7168,1.5176311069064672
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,65536,6144,1.3354177474975586
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,65536,8192,1.9365270402696397
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,65536,7168,1.7244577407836914
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,65536,5120,1.1135128868950737
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,65536,4096,0.8936292860243055
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,65536,6144,1.4288497500949437
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,65536,4096,0.9407208760579427
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,65536,5120,1.211937798394097
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,65536,3584,0.7935671276516385
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,65536,3072,0.6806746588812934
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,65536,2560,0.5421706835428873
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,65536,3584,0.8588622411092123
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,65536,3072,0.7181386417812772
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,65536,2560,0.6086026827494303
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,65536,2048,0.518855094909668
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,65536,1024,0.22335288259718153
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,65536,1536,0.3948933283487956
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,65536,2048,0.5836515426635742
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,65536,768,0.17966843975914848
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,65536,1024,0.3856311109330919
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,65536,512,0.13599556022220188
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,65536,768,0.23553511831495497
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,65536,256,0.10604000091552734
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,65536,128,0.07922577857971191
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,65536,512,0.20998399787478975
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,65536,64,0.06789866420957777
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,65536,256,0.18348799811469185
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,65536,32,0.07123821973800659
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,65536,128,0.17994756168789336
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,65536,64,0.17365154955122206
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,65536,32,0.17691555288102892
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,65536,1536,0.3094408777025011
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,65536,51200,11.006755405002169
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,51200,16384,2.6877110799153647
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,51200,12288,2.1131057739257812
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,51200,16384,3.4234142303466797
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,51200,12288,2.463382297092014
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,51200,10240,1.831033706665039
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,51200,8192,1.4370942645602758
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,51200,10240,1.9890213012695312
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,51200,7168,1.2517236073811848
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,65536,51200,17.099129570855034
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,51200,51200,8.769579569498697
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,51200,8192,1.592500474717882
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,51200,7168,1.343143145243327
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,51200,6144,1.0589617623223198
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,51200,5120,0.9535350799560547
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,51200,4096,0.6211333274841309
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,51200,5120,0.9607893625895182
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,51200,6144,1.1857884724934895
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,51200,3072,0.4717066552903917
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,51200,3584,0.705442640516493
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,51200,4096,0.7935795783996582
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,51200,3584,0.6904017660352918
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,51200,3072,0.5769511328803169
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,51200,2048,0.3184533384111193
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,51200,2560,0.4275360107421875
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,51200,65536,11.147356669108072
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,51200,1536,0.245194673538208
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,51200,1024,0.2014311154683431
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,51200,768,0.14074933528900146
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,51200,2048,0.404146671295166
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,51200,1536,0.33684621916876895
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,51200,2560,0.506864865620931
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,51200,512,0.10370933347278172
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,51200,256,0.0758426653014289
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,51200,128,0.06452711423238118
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,51200,768,0.20272355609469941
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,51200,1024,0.24988177087571886
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,51200,256,0.14329155286153158
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,51200,64,0.06356000237994723
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,51200,128,0.13589866956075033
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,51200,64,0.13997956116994223
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,51200,32,0.1383484469519721
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,51200,512,0.1617964506149292
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,51200,32,0.06521155436833699
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,16384,16384,0.9192541970147027
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,51200,51200,13.905937194824219
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,16384,16384,1.278678258260091
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,16384,12288,0.7056630982293023
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,16384,51200,2.9343022240532766
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,16384,12288,0.9697732925415039
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,16384,10240,0.5733111169603136
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,16384,8192,0.4487297799852159
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,16384,10240,0.7815030945671929
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,16384,65536,3.757676442464193
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,16384,7168,0.4105839994218614
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,16384,8192,0.6216204431321886
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,16384,6144,0.3440391222635905
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,16384,5120,0.32655466927422416
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,16384,7168,0.6108320024278429
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,16384,4096,0.2303466796875
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,16384,6144,0.4826346503363715
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,16384,5120,0.37390489048428005
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,16384,3584,0.19569955931769478
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,16384,3072,0.16619466410742864
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,16384,2560,0.14003554979960123
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,16384,3584,0.30956710709465873
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,16384,2048,0.1136746671464708
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,16384,2560,0.19723378287421334
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,16384,3072,0.22581421004401314
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,16384,1024,0.061584002441830106
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,16384,2048,0.1799128850301107
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,16384,768,0.047945777575174965
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,16384,51200,5.099096086290148
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,16384,1536,0.12920178307427302
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,16384,512,0.039926220973332725
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,16384,1024,0.09694044457541572
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,16384,256,0.02909244431389703
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,16384,768,0.07802133427725898
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,16384,512,0.06697511010699801
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,16384,128,0.027948445743984644
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,16384,256,0.056461334228515625
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,16384,64,0.022648889157507155
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,16384,128,0.05345777670542399
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,16384,32,0.020901333954599168
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,16384,64,0.05567200316323174
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,16384,32,0.054155555036332875
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,16384,4096,0.38900444242689347
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,16384,1536,0.08863644467459784
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,16384,65536,6.39468977186415
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,51200,65536,18.383309258355034
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,12288,16384,0.5941013230217828
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,12288,12288,0.5100337664286295
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,12288,10240,0.42495377858479816
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,12288,16384,1.0461680094401042
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,12288,12288,0.7870622211032443
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,12288,8192,0.29791466395060223
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,12288,51200,2.0785581800672746
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,12288,7168,0.25359733899434406
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,12288,10240,0.6657742394341363
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,12288,65536,2.6046986050075955
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,12288,8192,0.5031769010755751
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,12288,6144,0.2436924510531955
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,12288,5120,0.22100978427463105
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,12288,7168,0.4685360060797797
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,12288,4096,0.16212356090545654
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,12288,6144,0.3738124370574951
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,12288,3584,0.14735644393497044
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,12288,5120,0.3077270984649658
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,12288,3072,0.12781511412726507
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,12288,2560,0.10661511288748847
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,12288,2048,0.0873146653175354
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,12288,3584,0.2135946618186103
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,12288,4096,0.2658640013800727
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,12288,1536,0.06870666477415296
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,12288,3072,0.18564532862769234
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,12288,1024,0.04895111256175571
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,12288,2560,0.1599066654841105
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,12288,768,0.03874666823281182
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,12288,2048,0.14528089099460179
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,12288,1536,0.105131553279029
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,12288,256,0.02219377789232466
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,12288,1024,0.08671022123760647
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,12288,768,0.06623644298977323
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,12288,64,0.016155555844306946
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,12288,256,0.04593333270814684
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,12288,32,0.016161777906947665
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,12288,512,0.05483288897408379
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,12288,64,0.04214844438764784
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,12288,32,0.0411137772930993
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,12288,51200,3.8937759399414062
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,12288,512,0.029639111624823675
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,12288,128,0.019371555911170114
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,12288,128,0.043624000416861645
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,12288,65536,5.043206108940972
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,10240,16384,0.5493724611070421
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,10240,12288,0.4207599957784017
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,10240,10240,0.364595545662774
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,10240,16384,0.9019360012478299
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,10240,51200,1.8780364990234375
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,10240,12288,0.6808604664272733
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,10240,8192,0.3066399892171224
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,10240,7168,0.257006221347385
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,10240,10240,0.5727013481987847
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,10240,65536,2.4719823201497397
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,10240,6144,0.23000176747639975
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,10240,8192,0.4427777661217584
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,10240,7168,0.3900880018870036
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,10240,5120,0.16794044441647002
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,10240,4096,0.152620448006524
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,10240,3584,0.12216267320844863
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,10240,6144,0.34011289808485246
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,10240,4096,0.2159573369556003
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,10240,5120,0.2930986616346571
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,10240,3072,0.11727110544840495
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,10240,3584,0.191213329633077
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,10240,2560,0.0915457804997762
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,10240,2048,0.07563822136984931
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,10240,1536,0.05894222524431017
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,10240,1024,0.04377777708901299
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,10240,3072,0.16541422737969294
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,10240,768,0.03194488750563727
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,10240,2560,0.14235822359720865
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,10240,2048,0.12253777186075847
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,10240,512,0.02460622290770213
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,10240,1536,0.09563999705844456
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,10240,256,0.020464888877338834
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,10240,128,0.016570667425791424
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,10240,1024,0.07120355632570055
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,10240,64,0.015036443869272867
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,10240,768,0.05713955561319987
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,10240,512,0.04736977815628052
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,10240,256,0.03902755512131585
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,10240,128,0.03701688845952352
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,10240,64,0.03522488805982802
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,10240,32,0.03461777832772996
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,10240,51200,3.5195679134792752
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,8192,16384,0.42307554350958926
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,8192,12288,0.32296445634629994
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,10240,65536,4.497909122043185
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,8192,16384,0.800871107313368
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,10240,32,0.019302222463819716
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,8192,51200,1.4203039805094402
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,8192,10240,0.2859271102481418
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,8192,8192,0.24959288703070748
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,8192,65536,1.8554276360405817
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,8192,10240,0.4866177770826552
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,8192,7168,0.21510667271084258
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,8192,6144,0.17732621563805473
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,8192,8192,0.3989235560099284
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,8192,5120,0.14754399988386366
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,8192,4096,0.11457067065768772
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,8192,6144,0.33706045150756836
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,8192,5120,0.23952889442443848
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,8192,3584,0.10625955793592666
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,8192,3072,0.08741955624686347
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,8192,4096,0.2028728855980767
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,8192,3584,0.1667342185974121
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,8192,2560,0.07265066438251071
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,8192,2048,0.0651351081000434
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,8192,12288,0.6028506490919325
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,8192,3072,0.14779999521043566
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,8192,51200,2.9025804731580944
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,8192,1536,0.04725955592261421
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,8192,2560,0.12485422028435601
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,8192,1024,0.03477777706252204
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,8192,768,0.02622933354642656
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,8192,512,0.020377778344684176
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,8192,2048,0.10454044739405315
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,8192,1536,0.0835919976234436
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,8192,256,0.015781333049138386
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,8192,1024,0.06197333335876465
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,8192,128,0.013983999689420065
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,8192,768,0.05151999990145365
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,8192,64,0.011872889267073737
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,8192,512,0.039965334865782
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,8192,32,0.012030222349696688
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,8192,256,0.033095998896492854
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,8192,128,0.03059555424584283
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,8192,7168,0.3750586774614122
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,8192,64,0.030887110365761652
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,8192,32,0.030159999926884968
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,8192,65536,3.8612179226345487
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,7168,16384,0.3836986753675673
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,7168,12288,0.3184728887346056
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,7168,16384,0.7242639859517416
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,7168,10240,0.2720675468444824
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,7168,12288,0.5508755577935113
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,7168,8192,0.20775911543104383
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,7168,10240,0.4510400030348036
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,7168,7168,0.18551999992794463
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,7168,6144,0.15552443928188747
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,7168,65536,1.645608901977539
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,7168,8192,0.4045404328240289
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,7168,7168,0.3146924442715115
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,7168,5120,0.12488088342878555
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,7168,4096,0.09933688905504014
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,7168,6144,0.29368888007269967
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,7168,3584,0.08220622274610731
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,7168,3072,0.07553511195712619
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,7168,5120,0.2348853217230903
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,7168,4096,0.1734080049726698
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,7168,2560,0.06304888592825995
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,7168,3584,0.1570133368174235
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,7168,2048,0.05267911156018575
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,7168,3072,0.14015644126468235
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,7168,1024,0.027373333772023518
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,7168,2560,0.12014399634467231
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,7168,2048,0.09917866521411473
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,7168,768,0.022384888596004907
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,7168,1536,0.07708355453279284
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,7168,512,0.017487110363112558
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,7168,256,0.01444533301724328
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,7168,1024,0.05731822384728325
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,7168,128,0.011799111134476133
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,7168,768,0.047600001096725464
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,7168,51200,1.1930586496988933
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,7168,512,0.037216888533698186
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,7168,64,0.010661332971519895
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,7168,256,0.030568887790044148
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,7168,32,0.011035555766688453
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,7168,51200,2.580486297607422
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,7168,128,0.02845422095722622
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,7168,32,0.027820444769329492
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,6144,16384,0.30721065733167857
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,7168,1536,0.04315822323163351
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,7168,65536,3.3639956580268016
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,6144,12288,0.26289865705702037
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,6144,16384,0.6729555659823947
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,6144,65536,1.3140124215020073
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,6144,10240,0.2156684398651123
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,6144,12288,0.5029528935750326
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,7168,64,0.02848177817132738
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,6144,8192,0.1770239935980903
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,6144,7168,0.14633688661787245
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,6144,6144,0.1339848836263021
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,6144,10240,0.4175208939446344
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,6144,8192,0.358328898747762
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,6144,5120,0.11457510789235432
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,6144,7168,0.29301155938042533
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,6144,4096,0.08919911252127753
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,6144,6144,0.24863200717502168
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,6144,3584,0.07410844167073567
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,6144,5120,0.2032702234056261
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,6144,3072,0.06575110885832045
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,6144,2560,0.05433333251211378
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,6144,3584,0.1420960028966268
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,6144,51200,1.01619381374783
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,6144,2048,0.0440248880121443
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,6144,3072,0.12387555175357395
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,6144,1536,0.03497599893146091
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,6144,2560,0.11015022463268703
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,6144,51200,2.376636505126953
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,6144,1024,0.02385066615210639
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,6144,768,0.02054222259256575
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,6144,512,0.015252444479200574
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,6144,1536,0.07038399908277723
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,6144,2048,0.08928800291485256
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,6144,256,0.011732444167137146
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,6144,768,0.04271733429696825
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,6144,1024,0.052983999252319336
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,6144,128,0.010501333408885531
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,6144,64,0.009313777916961247
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,6144,512,0.03544888893763224
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,6144,32,0.009306666751702627
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,6144,256,0.028029332558314007
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,6144,128,0.026093333959579468
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,6144,65536,2.964813232421875
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,6144,32,0.02642044425010681
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,5120,16384,0.2996506690979004
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,5120,51200,0.8722071117824979
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,5120,65536,1.1680853101942275
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,5120,16384,0.6097200181749132
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,5120,12288,0.2383955584632026
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,6144,64,0.0258240004380544
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,5120,10240,0.1841813325881958
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,5120,8192,0.1412364509370592
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,5120,7168,0.11706488662295872
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,5120,12288,0.49404266145494247
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,5120,10240,0.40717599127027726
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,6144,4096,0.182732449637519
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,5120,8192,0.30751199192470974
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,5120,6144,0.11525600486331516
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,5120,5120,0.08735111024644639
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,5120,4096,0.07493955559200711
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,5120,7168,0.26890844768948025
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,5120,3584,0.06938133637110393
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,5120,6144,0.23097599877251518
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,5120,5120,0.18712000052134195
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,5120,3072,0.058127111858791776
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,5120,2560,0.04600266615549723
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,5120,4096,0.14694400628407797
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,5120,2048,0.036638223462634616
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,5120,51200,2.1097422705756292
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,5120,1536,0.030125333203209773
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,5120,3584,0.1305448876486884
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,5120,1024,0.021521778570281133
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,5120,3072,0.11471111244625515
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,5120,768,0.01737422247727712
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,5120,2560,0.09722755352656047
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,5120,512,0.014144000079896716
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,5120,2048,0.08223022354973687
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,5120,256,0.010384000009960597
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,5120,1536,0.064355558819241
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,5120,1024,0.04841244551870558
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,5120,768,0.041830221811930336
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,5120,64,0.008328888979223039
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,5120,256,0.02571644385655721
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,5120,32,0.009338666995366415
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,5120,128,0.023709333605236475
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,5120,65536,2.6337547302246094
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,5120,64,0.02346755564212799
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,5120,32,0.023349333140585158
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,4096,16384,0.2382133271959093
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,4096,12288,0.1597786611980862
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,4096,51200,0.7032408714294434
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,4096,65536,0.9878070619371203
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,4096,10240,0.16158044338226318
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,5120,128,0.009655111365848118
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,4096,12288,0.4289626545376248
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,4096,8192,0.1511875523461236
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,5120,512,0.031890667147106595
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,4096,7168,0.10800177521175808
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,4096,6144,0.09240355756547715
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,4096,10240,0.39584533373514813
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,4096,8192,0.27940000428093803
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,4096,7168,0.29209778043958873
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,4096,4096,0.06301955382029216
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,4096,6144,0.20867466926574707
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,4096,3584,0.05940000216166178
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,4096,5120,0.18029867278205025
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,4096,3072,0.04878044459554884
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,4096,4096,0.1423893372217814
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,4096,2560,0.04099022348721822
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,4096,3584,0.11970578299628364
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,4096,2048,0.034279998805787824
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,4096,51200,1.834520975748698
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,4096,1536,0.02716355522473653
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,4096,16384,0.5548337830437554
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,4096,3072,0.10542666912078857
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,4096,1024,0.017356443736288283
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,4096,2560,0.09092266692055596
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,4096,2048,0.07158488697475858
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,4096,512,0.011921777493423887
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,4096,1536,0.058261334896087646
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,4096,1024,0.04340089029735989
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,4096,256,0.00924355536699295
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,4096,768,0.03602666656176249
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,4096,128,0.00758844448460473
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,4096,64,0.0069155556460221606
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,4096,512,0.028668443361918133
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,4096,65536,2.3384390936957464
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,4096,32,0.006989333364698622
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,4096,256,0.023201778531074524
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,4096,128,0.02165066699186961
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,4096,64,0.021317332983016968
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,4096,32,0.021125333176718816
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,4096,5120,0.07839466465844049
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,3584,16384,0.22746666272481283
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,3584,12288,0.16104888916015625
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,3584,51200,0.6436364385816786
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,3584,65536,0.7639093399047852
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,3584,16384,0.5268533494737413
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,3584,10240,0.13460889127519396
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,4096,768,0.014312000738249885
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,3584,8192,0.1065066655476888
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,3584,7168,0.09415111276838516
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,3584,12288,0.4010942247178819
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,3584,6144,0.08704533179601033
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,3584,10240,0.34829065534803605
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,3584,8192,0.3002320130666097
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,3584,7168,0.23307998975118002
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,3584,4096,0.053095112244288124
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,3584,6144,0.1994382275475396
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,3584,3584,0.046704888343811035
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,3584,5120,0.16581332683563232
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,3584,3072,0.03931555483076308
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,3584,2560,0.03558311197492812
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,3584,4096,0.1280097828971015
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,3584,3584,0.11295555697547065
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,3584,2048,0.027348443865776062
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,3584,3072,0.09926399919721816
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,3584,1536,0.02312266661061181
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,3584,1024,0.01742755538887448
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,3584,2560,0.08681066830952962
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,3584,768,0.015152888165579902
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,3584,2048,0.06796266635258992
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,3584,512,0.01184622198343277
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,3584,1536,0.05561511384116279
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,3584,1024,0.04114400015936957
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,3584,256,0.008953777452309927
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,3584,768,0.033760888708962336
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,3584,512,0.027317333552572463
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,3584,64,0.00666133314371109
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,3584,256,0.02196088929971059
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,3584,128,0.02058844433890449
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,3584,32,0.0068915556702348925
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,3584,64,0.020280000236299302
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,3584,32,0.01992266707950168
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,3584,5120,0.06785066922505696
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,3072,65536,0.6101484298706055
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,3072,16384,0.1665982272889879
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,3072,51200,0.49901511934068465
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,3072,12288,0.12185245090060765
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,3584,51200,1.7449146906534831
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,3072,10240,0.1111804379357232
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,3584,128,0.007595555649863348
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,3072,8192,0.08930489089753892
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,3072,12288,0.4029031064775255
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,3072,7168,0.08258755339516534
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,3584,65536,2.2527963850233292
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,3072,10240,0.31258755260043675
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,3072,6144,0.06667288806703356
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,3072,5120,0.05544355511665344
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,3072,8192,0.25170400407579213
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,3072,4096,0.044236444764667086
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,3072,7168,0.2245262198978
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,3072,3584,0.041672888729307384
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,3072,6144,0.1867333385679457
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,3072,3072,0.03494666682349311
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,3072,4096,0.12092088328467475
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,3072,2560,0.02773155603143904
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,3072,2048,0.02370133333735996
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,3072,3584,0.10830577876832749
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,3072,3072,0.09275466865963405
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,3072,1536,0.01906488835811615
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,3072,2560,0.07912800047132704
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,3072,51200,1.6410551071166992
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,3072,2048,0.06452888912624784
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,3072,768,0.011719110939237805
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,3072,1536,0.04999644557634989
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,3072,512,0.009249777429633671
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,3072,256,0.007263999846246507
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,3072,1024,0.038549333810806274
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,3072,768,0.03155288762516446
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,3072,128,0.006625777731339137
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,3072,65536,2.0642231835259333
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,3072,64,0.005943999936183293
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,3072,512,0.02574577762020959
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,3072,32,0.006239999913507038
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,3072,256,0.021088000800874498
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,3072,128,0.019342222147517733
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,3072,64,0.018901333212852478
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,3072,32,0.018887110882335238
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,3072,16384,0.5147920184665257
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,2560,16384,0.14115911059909397
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,3072,5120,0.1603271166483561
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,2560,65536,0.5547893312242296
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,2560,51200,0.4440240065256755
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,2560,12288,0.11224533451928033
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,2560,10240,0.0925333301226298
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,2560,8192,0.07386489046944512
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,3072,1024,0.014626666903495789
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,2560,16384,0.4662462340460883
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,2560,7168,0.06624088684717815
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,2560,12288,0.3658586608039008
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,2560,6144,0.054451555013656616
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,2560,10240,0.2971137894524468
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,2560,5120,0.04786044359207153
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,2560,8192,0.2600462171766493
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,2560,4096,0.036348445547951594
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,2560,7168,0.2090817822350396
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,2560,3584,0.033843557039896645
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,2560,6144,0.177236451043023
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,2560,3072,0.029321776496039495
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,2560,5120,0.14489332834879556
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,2560,2560,0.02532800038655599
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,2560,2048,0.021575111481878493
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,2560,3584,0.10200977987713283
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,2560,1536,0.0177839994430542
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,2560,3072,0.0890008873409695
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,2560,2560,0.07484000258975558
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,2560,1024,0.013745778136783175
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,2560,2048,0.06232355700598823
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,2560,768,0.01204711116022534
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,2560,512,0.009654222263230218
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,2560,1536,0.04866310954093933
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,2560,256,0.007652444144090016
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,2560,1024,0.03633066680696275
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,2560,768,0.029841777351167467
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,2560,128,0.005940444353553984
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,2560,64,0.005557333429654439
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,2560,512,0.024511110451486375
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,2560,65536,1.8984425862630208
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,2560,32,0.005548444473081165
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,2560,256,0.01925244430700938
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,2560,128,0.01819022165404426
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,2560,64,0.01757777730623881
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,2560,32,0.017854221993022494
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,2048,16384,0.12566755877600774
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,2048,51200,0.3530257807837592
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,2048,65536,0.4273048771752252
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,2048,12288,0.0908542209201389
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,2048,10240,0.07748711109161377
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,2560,4096,0.11892178323533799
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,2048,8192,0.06350666946834989
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,2048,16384,0.4371493392520481
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,2560,51200,1.4965795940823023
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,2048,12288,0.348307556576199
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,2048,7168,0.05632355478074816
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,2048,6144,0.046570665306515165
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,2048,5120,0.037363555696275495
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,2048,10240,0.30013243357340497
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,2048,8192,0.22408623165554473
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,2048,4096,0.0317520002524058
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,2048,7168,0.19623200098673502
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,2048,3584,0.02811288833618164
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,2048,6144,0.16580711470709905
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,2048,3072,0.024752888414594863
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,2048,5120,0.13709510697258845
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,2048,2560,0.020896888441509668
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,2048,2048,0.01716088917520311
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,2048,4096,0.10732444127400716
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,2048,1536,0.013986666997273764
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,2048,3584,0.09455821911493938
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,2048,1024,0.01075644459989336
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,2048,3072,0.08353422085444133
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,2048,51200,1.365995513068305
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,2048,768,0.008924444516499838
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,2048,2048,0.05973955657747057
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,2048,512,0.0070977773931291364
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,2048,256,0.00627377794848548
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,2048,1536,0.0449022220240699
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,2048,1024,0.032913777563307024
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,2048,128,0.00553688903649648
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,2048,768,0.028040889236662123
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,2048,64,0.004629333400064045
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,2048,32,0.004881777697139316
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,2048,65536,1.74273861779107
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,2048,256,0.01843644513024224
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,2048,128,0.017186666528383892
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,2048,64,0.016823111308945548
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,2048,32,0.016488000750541687
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,1536,16384,0.08691555261611938
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,1536,12288,0.06739466720157199
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,1536,51200,0.26382933722602
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,1536,65536,0.3376595444149441
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,1536,10240,0.05910755528344048
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,1536,8192,0.0503768887784746
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,1536,16384,0.41411911116705996
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,1536,10240,0.2633857727050781
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,1536,12288,0.3136133352915446
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,1536,7168,0.03756266501214769
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,1536,8192,0.21687822871738008
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,1536,6144,0.03326311045222812
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,1536,5120,0.0281315545241038
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,2048,2560,0.07083288828531902
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,1536,7168,0.1845759948094686
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,1536,4096,0.023741333021057978
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,1536,6144,0.16046399540371364
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,1536,3584,0.0211191111140781
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,1536,5120,0.12885955969492593
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,2048,512,0.023324444890022278
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,1536,3072,0.018717333674430847
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,1536,4096,0.1012079980638292
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,1536,2560,0.016544888416926067
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,1536,2048,0.013995556367768182
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,1536,51200,1.2783600489298503
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,1536,1536,0.011729777687125735
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,1536,3072,0.07910577456156413
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,1536,2560,0.06635200315051608
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,1536,768,0.00795999997191959
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,1536,2048,0.054084443383746676
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,1536,512,0.006632888896597757
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,1536,1536,0.0420684450202518
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,1536,1024,0.031521777311960854
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,1536,256,0.005528000079923206
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,1536,768,0.026312000221676294
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,1536,65536,1.6348195605807836
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,1536,128,0.004559111264016894
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,1536,512,0.021779555413458083
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,1536,64,0.00453333349691497
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,1536,32,0.004536889079544279
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,1536,256,0.017469333277808297
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,1536,128,0.015643555257055495
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,1536,64,0.015472888946533203
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,1536,32,0.015188443991872998
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,1024,65536,0.2539964516957601
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,1024,51200,0.19386933909522164
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,1024,12288,0.04650488826963636
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,1024,16384,0.3937351173824734
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,1024,12288,0.29141778416103786
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,1536,3584,0.09245866537094116
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,1024,10240,0.04158044523662991
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,1536,1024,0.009031111167536842
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,1024,8192,0.0311173333062066
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,1024,7168,0.027448000179396734
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,1024,6144,0.023511999183230933
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,1024,5120,0.02108888824780782
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,1024,10240,0.24438577228122285
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,1024,8192,0.20194578170776367
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,1024,4096,0.0173662222094006
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,1024,6144,0.145233776834276
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,1024,3584,0.015285332997639975
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,1024,3072,0.014055111342006259
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,1024,5120,0.11842400497860378
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,1024,51200,1.1767750846015084
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,1024,2560,0.012042666474978128
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,1024,4096,0.09404622183905707
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,1024,2048,0.010336000058386061
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,1024,3584,0.08267466889487372
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,1024,3072,0.07179199986987643
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,1024,16384,0.06349422534306844
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,1024,65536,1.4994391335381403
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,1024,1024,0.0070497774415545994
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,1024,2048,0.049031111929151744
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,1024,768,0.006252444452709622
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,1024,512,0.005555555638339784
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,1024,1536,0.0387644436624315
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,1024,256,0.004545777622196409
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,1024,1024,0.029045333464940388
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,1024,768,0.024339555038346186
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,1024,512,0.020247111717859905
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,1024,256,0.01625066664483812
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,1024,32,0.0038311113086011675
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,1024,128,0.01477777792347802
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,1024,64,0.014458666245142618
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,1024,32,0.014126222994592456
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,768,65536,0.20658489068349203
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,768,51200,0.15761066807640925
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,768,16384,0.05239911211861504
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,1024,7168,0.172015110651652
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,768,12288,0.038430223862330117
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,1024,1536,0.008797333472304875
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,768,10240,0.03192799952295091
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,768,16384,0.3721742100185818
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,768,8192,0.026542221506436665
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,768,12288,0.28280533684624565
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,768,7168,0.023689778314696416
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,1024,128,0.004208000169859992
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,1024,64,0.0038488888078265717
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,768,6144,0.02096533278624217
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,768,10240,0.2372791237301297
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,768,5120,0.018280888597170513
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,768,4096,0.015385778413878547
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,768,8192,0.1906133360332913
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,768,7168,0.16717333263821074
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,768,3584,0.01350933313369751
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,768,3072,0.01198933356338077
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,768,6144,0.14126133918762207
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,768,5120,0.11452444394429524
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,768,51200,1.1414995193481445
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,768,4096,0.09029777844746907
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,768,2560,0.011063111325105032
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,768,2048,0.009367110828558603
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,768,65536,1.451282713148329
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,768,3584,0.08024711079067655
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,768,1536,0.008967999782827165
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,768,3072,0.06974844137827556
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,768,1024,0.007255111303594377
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,768,768,0.005960888746711943
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,768,2048,0.04650488826963636
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,768,512,0.0052684446175893145
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,768,1536,0.036680890454186335
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,768,1024,0.02775555517938402
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,768,128,0.003867555409669876
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,768,768,0.023707555400000677
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,768,64,0.003842666745185852
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,768,512,0.019661333825853135
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,768,256,0.015481778317027621
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,768,32,0.0038488888078265717
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,768,128,0.014105778601434497
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,768,64,0.013768889009952545
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,768,32,0.013766222529941134
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,512,65536,0.1528657807244195
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,512,16384,0.04181333382924398
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,512,51200,0.12072622776031494
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,512,12288,0.03012266755104065
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,512,16384,0.3621075683169895
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,512,12288,0.27420088979932994
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,512,10240,0.02384888960255517
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,512,8192,0.01960177719593048
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,768,2560,0.05905510981877645
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,512,7168,0.01752622259987725
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,768,256,0.004519999855094486
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,512,10240,0.23054843478732637
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,512,6144,0.015557333827018738
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,512,8192,0.18513154983520508
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,512,5120,0.013291555146376291
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,512,4096,0.011805333197116852
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,512,7168,0.16177599959903294
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,512,51200,1.1033990648057725
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,512,6144,0.1373306645287408
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,1024,2560,0.061214221848381885
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,512,3584,0.010672888822025724
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,512,5120,0.11094311210844253
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,512,3072,0.011482666763994427
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,512,2560,0.009883555273214975
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,512,4096,0.08733510971069336
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,512,2048,0.008956444760163626
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,512,1536,0.007610666255156199
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,512,65536,1.408890618218316
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,512,1024,0.006058666855096817
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,512,3584,0.07738933298322889
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,512,3072,0.06764444377687243
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,512,768,0.00555644432703654
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,512,2560,0.056695110268063016
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,512,512,0.004576888763242298
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,512,2048,0.0455644428730011
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,512,256,0.004013333469629288
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,512,1536,0.03502666619088914
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,512,128,0.003556444413132138
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,512,1024,0.027076444692081873
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,512,64,0.0032133333798911837
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,512,32,0.0032097777972618737
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,512,768,0.023043556345833674
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,512,512,0.01924533314175076
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,512,256,0.014827556080288358
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,512,128,0.01348000019788742
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,256,65536,0.10632622241973877
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,512,64,0.013119999733236102
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,512,32,0.013064888616402945
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,256,51200,0.08095733324686687
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,256,16384,0.03313244382540385
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,256,12288,0.0222044438123703
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,256,10240,0.01907999979125129
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,256,8192,0.013863999810483722
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,256,7168,0.012785777449607849
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,256,6144,0.011755555868148804
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,256,8192,0.17977778116861978
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,256,10240,0.22320087750752768
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,256,12288,0.26585067643059623
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,256,16384,0.3504355483584934
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,256,7168,0.15701511171129015
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,256,5120,0.010092444717884064
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,256,4096,0.008856000171767341
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,256,6144,0.1329208877351549
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,256,3584,0.008047999607192146
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,256,3072,0.0075288886825243635
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,256,2560,0.006643555644485686
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,256,2048,0.005940444353553984
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,256,5120,0.10759555631213719
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,256,4096,0.084733333852556
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,256,3584,0.07436355617311266
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,256,3072,0.06457866562737359
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,256,2560,0.053970668050977916
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,256,1024,0.004545777622196409
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,256,768,0.0041928887367248535
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,256,2048,0.042790220843421094
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,256,512,0.003559111307064692
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,256,1536,0.034007999632093645
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,256,1024,0.026214222113291424
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,256,256,0.003510222252872255
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,256,768,0.022488888767030504
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,256,128,0.0031715554909573663
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,256,512,0.018530666828155518
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,256,64,0.0028826666788922418
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,256,51200,1.0673351287841797
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,256,32,0.003170666595300039
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,256,256,0.014442667365074158
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,256,128,0.013073777986897362
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,256,64,0.012726222475369772
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,256,32,0.012488000094890594
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,128,51200,0.054526223076714404
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,256,65536,1.3636471430460613
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,128,16384,0.018593778212865193
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,128,12288,0.013089777694808112
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,128,10240,0.013859555953078799
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,128,16384,0.34056443638271755
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,128,12288,0.25866577360365123
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,128,10240,0.217412445280287
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,128,7168,0.011759999725553723
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,256,1536,0.005212444398138259
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,128,8192,0.17461333009931776
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,128,6144,0.010497777826256223
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,128,5120,0.009323555562231276
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,128,7168,0.15240355332692465
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,128,4096,0.007948444121413762
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,128,51200,1.0377893447875977
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,128,6144,0.12911289268069798
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,128,5120,0.10407644510269165
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,128,3584,0.007606222397751278
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,128,3072,0.006969778074158563
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,128,4096,0.08151733213000827
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,128,65536,0.06491111384497748
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,128,2560,0.006074666563007567
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,128,65536,1.3282257715861003
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,128,2048,0.005572444448868434
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,128,3584,0.07221244441138373
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,128,1536,0.004872000051869286
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,128,3072,0.06189511219660441
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,128,1024,0.004378666480382283
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,128,768,0.0041777777175108595
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,128,2560,0.052728000614378184
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,128,512,0.003605333467324575
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,128,1536,0.032644444041781955
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,128,256,0.0032044444233179092
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,128,1024,0.025536888175540503
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,128,768,0.02196888956758711
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,128,512,0.018188445104493033
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,128,64,0.002903999967707528
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,128,256,0.013760888742076026
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,128,32,0.0029608888758553397
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,128,128,0.01237777786122428
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,128,8192,0.014129777749379476
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,64,65536,0.06288888719346789
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,128,64,0.012387555506494312
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,128,32,0.011738667057620155
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,64,51200,0.052461332745022245
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,64,16384,0.014480888843536377
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,64,12288,0.014185777968830533
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,64,10240,0.012718222207493253
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,64,12288,0.25844889216952854
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,64,16384,0.3404924339718289
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,64,10240,0.216776000128852
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,64,7168,0.01073688848151101
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,64,8192,0.17457955413394502
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,64,6144,0.009471110999584198
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,128,2048,0.04145066605673896
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,64,5120,0.009312888814343346
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,64,4096,0.007717333734035492
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,128,128,0.003195555466744635
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,64,3584,0.007304000357786815
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,64,51200,1.0373200310601127
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,64,6144,0.1288951105541653
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,64,3072,0.006586666736337874
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,64,5120,0.10371288988325332
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,64,2560,0.006217777729034424
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,64,4096,0.08181511031256782
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,64,2048,0.005566222386227713
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,64,3584,0.07171999745898776
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,64,1536,0.0047377778424157035
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,64,65536,1.3273333443535698
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,64,1024,0.00388355553150177
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,64,2560,0.05205511053403219
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,64,2048,0.040560000472598605
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,64,1536,0.032582223415374756
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,64,512,0.003519999898142285
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,64,1024,0.02535199953450097
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,64,256,0.0033493333806594214
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,64,768,0.02164977788925171
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,64,128,0.002833777831660377
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,64,64,0.0028088889602157804
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,64,512,0.017679999272028606
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,64,256,0.013776000175211163
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,64,32,0.0028168888141711554
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,64,8192,0.01146577795346578
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,64,128,0.01239111108912362
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,32,65536,0.06344622373580933
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,32,51200,0.05046222276157803
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,64,32,0.011725333001878528
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,32,16384,0.013464888764752282
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,64,7168,0.15206666787465414
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,32,12288,0.011057777537239922
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,32,16384,0.3406826655069987
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,64,3072,0.06255377663506402
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,64,768,0.0038897775941424896
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,32,8192,0.009105777574910058
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,32,10240,0.21676354938083223
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,32,51200,1.0370897716946073
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,32,7168,0.008636444807052612
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,32,6144,0.008992888861232335
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,64,64,0.0119991112086508
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,32,5120,0.007607999775144789
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,32,65536,1.325295130411784
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,32,4096,0.009367110828558603
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,32,7168,0.15228266186184353
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,32,6144,0.12865422831641302
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,32,3584,0.008968888885445064
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,32,5120,0.10385066933102077
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,32,3072,0.007992888490358988
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,32,2560,0.007452444069915348
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,32,4096,0.08141155375374688
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,32,2048,0.005223999834722943
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,32,3584,0.07252177927229139
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,32,3072,0.062146663665771484
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,32,1536,0.004551110996140374
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,32,2560,0.051338666015201144
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,32,1024,0.004024888906213972
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,32,768,0.0037804444630940757
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,32,2048,0.04112977782885233
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,32,512,0.00319377767542998
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,32,1536,0.03256977929009332
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,32,10240,0.010463111102581024
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,32,256,0.003175111073586676
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,32,1024,0.02536800007025401
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,32,12288,0.2582186592949761
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,32,128,0.0028151110228565005
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,32,64,0.0028568889117903183
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,32,512,0.01789866718981001
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,32,256,0.013751111096805997
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,32,128,0.012167111039161682
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,32,64,0.011804444094498953
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,32,32,0.011883555187119378
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,32,8192,0.17419466707441542
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2817,32,768,0.021547555923461914
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2817,32,32,0.0028044444819291434
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,65536,16384,3.554672876993815
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,65536,12288,2.7115306854248047
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,65536,12288,3.059414121839735
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,65536,16384,4.214844597710504
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,65536,10240,2.40245607164171
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,65536,16384,3.7490916781955295
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,65536,10240,2.4915688832600913
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,65536,12288,2.825145721435547
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,65536,10240,2.3201270633273654
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,65536,8192,1.9622781541612413
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,65536,8192,2.0103261735704208
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,65536,7168,1.6989066865709093
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,65536,7168,1.644002702501085
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,65536,8192,1.8600514729817708
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,65536,6144,1.5537849002414281
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,65536,5120,1.152135107252333
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,65536,7168,1.6324151357014973
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,65536,6144,1.4213120142618816
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,65536,51200,11.559560139973959
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,65536,5120,1.1940782335069444
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,65536,6144,1.3912870619032118
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,65536,4096,0.9028861787584094
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,65536,4096,0.9402151107788086
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,65536,3584,0.7568755679660373
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,65536,5120,1.148206180996365
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,65536,3584,0.8429519865247938
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,65536,3072,0.6511164241366917
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,65536,4096,0.8967840406629773
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,65536,3584,0.8107795715332031
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,65536,2560,0.5398497581481934
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,65536,3072,0.7410755687289767
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,65536,2560,0.6360088984171549
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,65536,2048,0.5002186563279893
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,65536,3072,0.6899555524190267
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,65536,2048,0.505933337741428
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,65536,2560,0.5783084233601888
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,65536,2048,0.47886843151516384
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,65536,1024,0.2370213402642144
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,65536,1536,0.4821750852796767
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,65536,1024,0.3059191173977322
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,65536,768,0.18716000186072457
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,65536,1536,0.38974044058058
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,65536,1024,0.2943271001180013
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,65536,512,0.14348355929056802
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,65536,256,0.10662577549616496
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,65536,512,0.20460177792443168
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,65536,512,0.19445333215925428
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,65536,128,0.07856533262464735
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,65536,256,0.1508071157667372
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,65536,256,0.18641689088609484
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,65536,64,0.07750933037863837
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,65536,128,0.1655528942743937
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,65536,1536,0.3914195431603326
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,65536,32,0.07427466577953763
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,65536,128,0.11820977263980442
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,65536,64,0.16954310735066733
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,65536,32,0.16893333858913848
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,65536,768,0.252745787302653
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,65536,768,0.23727022276984322
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,65536,51200,17.58661397298177
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,65536,51200,12.71504126654731
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,51200,16384,2.763107511732313
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,51200,16384,3.345373365614149
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,51200,12288,2.029588487413194
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,51200,51200,8.575285169813368
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,51200,16384,3.01621945699056
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,51200,65536,10.810956319173178
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,51200,12288,2.37534311082628
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,51200,10240,1.8218729231092665
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,51200,12288,2.24053955078125
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,51200,8192,1.3884230719672308
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,51200,10240,2.0020692613389754
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,51200,51200,13.208812289767794
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,51200,10240,1.9001172383626301
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,51200,8192,1.6251067055596247
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,51200,7168,1.2653208838568795
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,51200,7168,1.3276631037394206
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,51200,6144,0.9930008782280816
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,51200,8192,1.4770124223497179
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,51200,6144,1.1607049306233723
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,51200,7168,1.259259541829427
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,51200,5120,0.8550186687045627
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,51200,5120,0.9669884575737847
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,51200,65536,16.7509765625
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,51200,4096,0.6389093399047852
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,51200,6144,1.1112506654527452
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,51200,51200,11.275763617621529
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,51200,5120,0.9221377902560763
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,51200,4096,0.8191102345784506
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,51200,3584,0.6145173178778754
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,51200,3072,0.608824888865153
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,51200,3584,0.6849102444118924
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,51200,4096,0.7177528805202908
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,51200,3072,0.6010408931308323
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,51200,2560,0.5128222041659886
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,51200,3584,0.6379342079162598
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,51200,2048,0.31020977762010365
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,51200,3072,0.571656862894694
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,51200,1536,0.23068621423509386
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,51200,2048,0.399292442533705
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,51200,2560,0.46606487698025173
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,51200,1024,0.1753164397345649
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,51200,2560,0.5022088686625162
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,51200,2048,0.421415991253323
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,51200,768,0.13276178307003444
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,51200,1024,0.2359457810719808
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,51200,65536,13.200464036729601
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,51200,512,0.10682577557033962
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,51200,1024,0.23293511072794595
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,51200,768,0.18839200337727866
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,51200,256,0.08077777756585015
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,51200,768,0.20414222611321342
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,51200,512,0.15949243969387478
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,51200,128,0.06700888607237074
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,51200,256,0.12487288316090901
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,51200,64,0.05623200204637316
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,51200,128,0.09713955720265706
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,51200,32,0.05573778020011055
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,51200,256,0.14029067092471653
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,51200,512,0.20106044080522326
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,51200,64,0.13357422086927626
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,51200,128,0.13320710923936632
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,51200,32,0.13501066631740993
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,51200,1536,0.3258435461256239
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,51200,1536,0.3164142237769233
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,16384,16384,0.7840906778971354
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,16384,16384,1.2663617663913302
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,16384,12288,0.594538688659668
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,16384,51200,2.8356107076009116
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,16384,16384,1.2354852888319228
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,16384,65536,3.492263158162435
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,16384,10240,0.4923404587639703
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,16384,12288,0.9386702643500434
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,16384,8192,0.4046177864074707
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,16384,12288,0.9264764785766602
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,16384,10240,0.7792551252577039
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,16384,10240,0.7904444270663791
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,16384,7168,0.3475920094384088
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,16384,51200,4.754025777180989
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,16384,8192,0.6234986517164443
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,16384,8192,0.6352328724331325
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,16384,6144,0.3400551213158502
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,16384,6144,0.45014132393731016
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,16384,7168,0.5264115333557129
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,16384,5120,0.3219946755303277
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,16384,7168,0.5555129051208496
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,16384,51200,4.083484649658203
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,16384,4096,0.25707822375827366
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,16384,6144,0.47238487667507595
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,16384,65536,5.9981172349717875
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,16384,4096,0.29376088248358834
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,16384,5120,0.39143911997477215
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,16384,3584,0.22050133016374376
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,16384,4096,0.3395644558800592
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,16384,3584,0.2583351135253906
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,16384,3072,0.1707306702931722
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,16384,3584,0.2968062294854058
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,16384,3072,0.2236257659064399
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,16384,2048,0.1094391081068251
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,16384,2560,0.19253155920240614
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,16384,3072,0.2515519989861382
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,16384,2560,0.21887021594577363
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,16384,1536,0.08987733390596177
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,16384,2048,0.15784800052642822
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,16384,2048,0.17812800407409668
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,16384,1024,0.05811022387610542
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,16384,1536,0.12616799937354192
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,16384,1536,0.14381333192189535
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,16384,768,0.046111110183927745
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,16384,5120,0.3687475522359212
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,16384,1024,0.09603822231292725
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,16384,512,0.03795911206139459
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,16384,768,0.07643200291527642
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,16384,768,0.09258133172988892
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,16384,256,0.026287110315428838
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,16384,512,0.06536000304751925
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,16384,512,0.07630488607618544
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,16384,128,0.023039110832744177
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,16384,256,0.05590044127570259
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,16384,256,0.05976533227496677
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,16384,64,0.025454221500290766
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,16384,128,0.05235111051135593
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,16384,128,0.04885244369506836
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,16384,32,0.026086222794320848
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,16384,2560,0.12431732813517253
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,16384,64,0.05260711246066623
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,16384,32,0.05272000034650167
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,16384,65536,5.224420335557726
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,16384,1024,0.11033155520757039
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,12288,16384,0.6932649082607694
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,12288,51200,2.3079821268717446
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,12288,65536,2.7114825778537326
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,12288,16384,1.059139569600423
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,12288,12288,0.5371528731452094
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,12288,16384,1.059509383307563
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,12288,10240,0.47663376066419816
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,12288,12288,0.7533182038201226
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,12288,12288,0.7832524511549207
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,12288,51200,3.7332229614257812
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,12288,8192,0.3478844430711534
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,12288,10240,0.6220791074964735
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,12288,7168,0.3163679970635308
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,12288,8192,0.5074915356106228
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,12288,10240,0.6709751023186578
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,12288,7168,0.42714489830864805
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,12288,8192,0.5489217970106337
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,12288,6144,0.27789423200819224
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,12288,65536,4.852464887830946
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,12288,6144,0.3698604371812608
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,12288,5120,0.2330568896399604
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,12288,7168,0.49848355187310117
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,12288,51200,3.3724365234375
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,12288,4096,0.17267378171284994
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,12288,6144,0.401546663708157
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,12288,5120,0.34430578019883895
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,12288,3584,0.15340888500213623
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,12288,4096,0.25309867329067653
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,12288,5120,0.3548026614718967
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,12288,3072,0.1297422250111898
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,12288,4096,0.2773742145962185
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,12288,3584,0.21142133076985678
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,12288,2560,0.1098124451107449
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,12288,3584,0.24245333671569824
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,12288,2048,0.08665511343214248
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,12288,3072,0.19106222523583305
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,12288,3072,0.21850044197506377
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,12288,1536,0.06681155496173434
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,12288,65536,4.3876728481716585
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,12288,2048,0.13182489077250162
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,12288,1024,0.04838666650984022
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,12288,2048,0.1531404389275445
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,12288,768,0.04225155711174011
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,12288,1536,0.12601510683695474
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,12288,1536,0.10680088731977676
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,12288,1024,0.09603466590245564
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,12288,512,0.029926220575968426
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,12288,1024,0.08742577499813503
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,12288,768,0.06375822093751696
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,12288,768,0.08084711101320055
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,12288,128,0.01830755505296919
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,12288,512,0.05397689011361864
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,12288,256,0.046635554896460645
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,12288,64,0.023648000425762598
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,12288,128,0.043771555026372276
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,12288,32,0.023247111174795363
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,12288,64,0.04099199838108487
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,12288,32,0.03990311092800564
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,12288,2560,0.1627555555767483
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,12288,2560,0.18326221572028267
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,12288,256,0.028195556667115953
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,12288,512,0.0665102203687032
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,12288,256,0.05212622218661838
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,12288,128,0.04110755523045858
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,10240,16384,0.5330133438110352
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,10240,65536,2.1438479953342013
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,10240,16384,0.9644159740871854
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,10240,12288,0.41534490055508083
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,10240,51200,1.6671066284179688
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,10240,16384,0.9488097296820747
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,10240,10240,0.33648888270060223
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,10240,12288,0.7180977927313911
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,10240,10240,0.554931534661187
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,10240,8192,0.28260800573560924
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,10240,12288,0.7110462188720703
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,10240,65536,4.41976081000434
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,10240,10240,0.6018640200297037
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,10240,8192,0.43638043933444554
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,10240,51200,2.9827974107530384
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,10240,8192,0.5005306667751735
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,10240,6144,0.19394666618771025
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,10240,7168,0.4171902338663737
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,10240,5120,0.15500888559553358
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,10240,7168,0.4249724547068278
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,10240,6144,0.33167733086480033
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,10240,65536,3.8453822665744357
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,10240,5120,0.2764506604936388
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,10240,6144,0.36699644724527997
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,10240,51200,3.4215369754367404
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,10240,3584,0.13018488883972168
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,10240,5120,0.31462489234076607
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,10240,4096,0.21426133314768472
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,10240,3072,0.10445600085788304
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,10240,3584,0.18741244739956328
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,10240,4096,0.25468089845445424
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,10240,2560,0.08283288611306085
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,10240,7168,0.25709689988030326
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,10240,3072,0.16395555602179632
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,10240,2048,0.069504890176985
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,10240,3072,0.19234577814737955
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,10240,2560,0.14104978243509927
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,10240,2560,0.16692799992031523
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,10240,2048,0.11631555027431911
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,10240,1024,0.03814311159981622
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,10240,2048,0.13952088356018066
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,10240,1536,0.09303377734290229
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,10240,768,0.03138044476509094
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,10240,1536,0.11318488915761311
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,10240,512,0.02293066680431366
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,10240,1024,0.0872231125831604
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,10240,1024,0.07096355491214328
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,10240,768,0.0566542214817471
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,10240,256,0.017439110411538016
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,10240,512,0.04695555567741394
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,10240,128,0.015071110592948066
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,10240,256,0.047898666726218335
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,10240,256,0.0382008883688185
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,10240,4096,0.1319511069191827
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,10240,64,0.013162666724787818
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,10240,32,0.013120888835854001
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,10240,128,0.04019822345839606
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,10240,128,0.03596977723969354
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,10240,64,0.034613334470325045
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,10240,32,0.03479555580351088
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,10240,3584,0.21823378403981528
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,10240,1536,0.05376177695062426
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,10240,768,0.07351377937528822
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,10240,512,0.061456885602739125
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,8192,16384,0.4398062229156494
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,8192,51200,1.7448292838202581
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,8192,65536,1.978808085123698
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,8192,12288,0.43036799960666233
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,8192,16384,0.861752880944146
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,8192,12288,0.585810661315918
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,8192,10240,0.2554551230536567
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,8192,51200,2.8535262213812937
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,8192,10240,0.4811520046657986
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,8192,12288,0.6648871103922526
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,8192,8192,0.2366844548119439
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,8192,65536,3.6373439364963107
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,8192,10240,0.5571769078572592
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,8192,8192,0.38162755966186523
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,8192,7168,0.20527556207444933
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,8192,8192,0.44578398598565
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,8192,6144,0.15972888469696045
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,8192,51200,2.6891341739230685
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,8192,5120,0.13179288970099554
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,8192,7168,0.34612356291876895
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,8192,6144,0.3450506793128119
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,8192,7168,0.38860532972547746
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,8192,4096,0.11212000581953262
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,8192,5120,0.2386862172020806
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,8192,6144,0.3355964554680719
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,8192,3584,0.09496800104777019
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,8192,16384,0.7783644464280871
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,8192,4096,0.20335822635226777
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,8192,65536,3.4716818067762585
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,8192,3072,0.08269421921836005
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,8192,4096,0.22548532485961914
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,8192,3584,0.16514844364590114
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,8192,2560,0.07668355438444349
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,8192,3584,0.20066844092475045
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,8192,2048,0.056162668599022754
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,8192,3072,0.1432408889134725
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,8192,3072,0.1805208921432495
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,8192,2560,0.12692622343699136
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,8192,1536,0.041895111401875816
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,8192,2560,0.15148888693915472
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,8192,1024,0.03131555517514547
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,8192,2048,0.10366221931245591
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,8192,2048,0.12834489345550537
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,8192,768,0.023952000670962866
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,8192,1536,0.10478311114841038
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,8192,1536,0.08249155680338542
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,8192,512,0.018819555640220642
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,8192,1024,0.08039466540018718
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,8192,768,0.048639999495612256
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,8192,1024,0.062215997113121875
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,8192,512,0.05638666947682699
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,8192,512,0.04031377699640062
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,8192,128,0.01481066644191742
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,8192,256,0.032250665956073336
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,8192,256,0.04418666826354133
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,8192,64,0.013802666631009845
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,8192,32,0.014087999860445658
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,8192,128,0.03014311194419861
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,8192,64,0.029912889003753662
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,8192,32,0.029583109749688044
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,8192,5120,0.30043554306030273
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,8192,768,0.06810577710469563
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,8192,256,0.014537778165605334
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,8192,128,0.03689510954750909
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,7168,51200,1.261249754163954
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,7168,65536,1.5753129323323567
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,7168,16384,0.395322667227851
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,7168,12288,0.30575821134779185
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,7168,16384,0.7566293080647787
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,7168,16384,0.8379128774007162
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,7168,12288,0.6198719872368706
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,7168,10240,0.28697154257032603
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,7168,12288,0.6268480088975694
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,7168,8192,0.22255378299289277
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,7168,10240,0.4450666639539931
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,7168,65536,3.289413240220812
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,7168,10240,0.5328559875488281
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,7168,7168,0.19949421617719862
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,7168,8192,0.35520089997185605
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,7168,6144,0.1614097754160563
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,7168,8192,0.4277004400889079
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,7168,7168,0.31968977716234
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,7168,6144,0.26361065440707737
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,7168,7168,0.37255199750264484
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,7168,5120,0.14514044920603433
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,7168,4096,0.11038844452963935
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,7168,51200,2.543024910820855
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,7168,6144,0.3363617791069879
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,7168,5120,0.21954845057593453
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,7168,65536,3.2689520517985025
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,7168,3584,0.09981244140201145
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,7168,4096,0.17293332682715523
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,7168,5120,0.2656053437127007
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,7168,3072,0.08880800008773804
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,7168,3584,0.1543075508541531
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,7168,4096,0.2156888908810086
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,7168,2560,0.07379733191596137
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,7168,3584,0.1929386721716987
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,7168,3072,0.1679333315955268
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,7168,2048,0.05868089199066162
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,7168,2560,0.11578578419155544
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,7168,1536,0.04215288824505276
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,7168,2560,0.14661867088741726
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,7168,2048,0.09576533238093059
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,7168,51200,2.4862594604492188
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,7168,2048,0.12233244048224555
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,7168,768,0.02233422299226125
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,7168,1536,0.07661688990063138
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,7168,1536,0.09961689180798
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,7168,512,0.017633777525689866
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,7168,1024,0.07671644290288289
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,7168,1024,0.05686666568120321
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,7168,768,0.04536177714665731
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,7168,256,0.01407911048995124
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,7168,768,0.06486311223771837
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,7168,128,0.011750222080283694
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,7168,512,0.03690222236845229
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,7168,512,0.05361510978804695
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,7168,64,0.010287111004193624
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,7168,256,0.04051733348104689
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,7168,256,0.0299288895395067
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,7168,32,0.010224888722101847
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,7168,128,0.03423466616206699
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,7168,128,0.028159111738204956
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,7168,64,0.028173334068722192
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,7168,32,0.027464888162083093
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,7168,3072,0.13555555873446995
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,7168,1024,0.027795556518766616
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,6144,16384,0.3554106553395589
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,6144,51200,1.0436230765448677
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,6144,65536,1.3195341957939994
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,6144,12288,0.2694915665520562
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,6144,16384,0.6608168813917372
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,6144,10240,0.2288773324754503
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,6144,12288,0.5164391199747721
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,6144,16384,0.7966293228997124
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,6144,12288,0.6152702437506782
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,6144,10240,0.42270933257208926
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,6144,51200,2.2991697523328996
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,6144,8192,0.18740888436635336
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,6144,10240,0.5047138002183702
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,6144,7168,0.16608799828423396
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,6144,8192,0.33423466152615017
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,6144,6144,0.1322382158703274
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,6144,7168,0.28824978404574925
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,6144,8192,0.41198134422302246
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,6144,65536,3.0235716501871743
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,6144,5120,0.11826133728027344
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,6144,7168,0.3924097749922011
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,6144,6144,0.245194673538208
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,6144,4096,0.09271822373072307
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,6144,5120,0.2077315515942044
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,6144,6144,0.30191289054022896
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,6144,3584,0.07567377885182698
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,6144,5120,0.2546453211042616
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,6144,4096,0.15909955236646864
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,6144,4096,0.21220355563693574
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,6144,3072,0.06914399729834662
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,6144,3584,0.13986133204566106
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,6144,2560,0.05551377932230631
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,6144,3584,0.18415021896362305
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,6144,65536,3.0891378190782337
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,6144,3072,0.12242755624983047
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,6144,2048,0.04850666721661886
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,6144,3072,0.16524444686041936
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,6144,1536,0.03517155514823066
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,6144,2560,0.10679022471110027
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,6144,1024,0.025570667452282373
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,6144,2048,0.1164142158296373
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,6144,2048,0.08842311302820842
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,6144,1536,0.07027910815344916
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,6144,1536,0.09541600280337864
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,6144,768,0.02129777769247691
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,6144,512,0.016200888488027785
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,6144,1024,0.05155466662512886
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,6144,1024,0.073216888639662
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,6144,256,0.011701333026091257
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,6144,768,0.04193333453602261
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,6144,51200,2.450416988796658
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,6144,512,0.03395288851526048
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,6144,512,0.05090399914317661
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,6144,128,0.01131199962562985
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,6144,256,0.03842577669355605
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,6144,256,0.027474666635195415
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,6144,64,0.009563555320103964
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,6144,32,0.009704888694816166
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,6144,128,0.032857778999540545
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,6144,128,0.025888888372315302
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,6144,64,0.025477333201302424
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,6144,32,0.025401777691311304
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,6144,2560,0.13848711384667292
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,6144,768,0.062013334698147245
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,5120,16384,0.3128986623552111
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,5120,51200,1.0166275236341689
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,5120,65536,1.2793351279364693
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,5120,12288,0.2629893355899387
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,5120,16384,0.5998311042785645
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,5120,12288,0.4653182029724121
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,5120,10240,0.171670224931505
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,5120,16384,0.7265244589911567
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,5120,8192,0.14630044831169978
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,5120,12288,0.5636017587449815
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,5120,51200,2.086268530951606
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,5120,10240,0.38000978363884824
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,5120,7168,0.12662133905622694
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,5120,10240,0.4702933099534776
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,5120,8192,0.31140976481967503
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,5120,6144,0.10774399836858113
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,5120,7168,0.26641421847873265
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,5120,65536,2.7008870442708335
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,5120,8192,0.382113774617513
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,5120,5120,0.08338933520846897
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,5120,7168,0.3370159996880426
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,5120,4096,0.06659644179873996
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,5120,6144,0.22731643252902559
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,5120,6144,0.2777297761705187
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,5120,3584,0.05852711200714111
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,5120,5120,0.23216978708902994
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,5120,3072,0.05374933282534281
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,5120,4096,0.14955466323428684
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,5120,4096,0.18709244992997912
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,5120,51200,2.194960912068685
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,5120,3584,0.12906577852037218
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,5120,2560,0.0447306666109297
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,5120,3584,0.16789778073628744
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,5120,2048,0.037251555257373385
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,5120,65536,2.7964729732937283
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,5120,3072,0.11215999391343857
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,5120,3072,0.1474426719877455
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,5120,1536,0.027268444498380024
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,5120,2560,0.1261626614464654
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,5120,2560,0.09632444381713867
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,5120,2048,0.08095822069380018
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,5120,2048,0.10682844453387791
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,5120,768,0.016171556380059984
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,5120,1536,0.06353955798678927
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,5120,1536,0.08751999669604832
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,5120,1024,0.048067556487189404
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,5120,1024,0.06781688663694593
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,5120,768,0.03793688946300083
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,5120,768,0.05750755469004313
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,5120,256,0.00965244405799442
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,5120,512,0.04759733213318718
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,5120,512,0.03154666556252374
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,5120,128,0.008347555167145198
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,5120,256,0.02574666672282749
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,5120,64,0.007722666694058313
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,5120,128,0.03132355544302199
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,5120,32,0.007983110845088959
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,5120,64,0.02334844403796726
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,5120,5120,0.18963021702236602
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,5120,32,0.02327022287580702
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,5120,1024,0.01982666717635261
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,5120,512,0.012714666624863943
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,5120,256,0.0377511117193434
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,4096,65536,1.079262203640408
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,5120,128,0.0236453331179089
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,4096,51200,0.7563591003417969
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,4096,16384,0.30199376742045086
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,4096,12288,0.21990756193796793
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,4096,16384,0.5442621972825792
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,4096,12288,0.4644959767659505
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,4096,16384,0.7114933331807455
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,4096,10240,0.15851910909016928
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,4096,12288,0.5141741964552138
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,4096,65536,2.382969750298394
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,4096,8192,0.13658400376637778
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,4096,51200,1.8531848059760199
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,4096,10240,0.34816622734069824
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,4096,7168,0.12035022841559516
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,4096,8192,0.2805119885338677
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,4096,6144,0.10603821939892238
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,4096,10240,0.43829067548116046
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,4096,8192,0.3517315652635362
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,4096,7168,0.24587644471062553
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,4096,7168,0.30729688538445366
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,4096,6144,0.20517155859205458
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,4096,4096,0.064337776766883
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,4096,65536,2.64284790886773
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,4096,6144,0.2759946717156304
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,4096,5120,0.16781866550445557
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,4096,5120,0.21880711449517143
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,4096,3584,0.050387554698520236
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,4096,3072,0.04560533497068617
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,4096,51200,2.066176096598307
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,4096,4096,0.13354044490390354
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,4096,4096,0.17716088559892443
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,4096,2560,0.03638489047686259
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,4096,3584,0.12123289373185898
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,4096,3584,0.15795466634962294
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,4096,2048,0.03012977706061469
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,4096,3072,0.10255999697579278
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,4096,3072,0.1378951072692871
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,4096,2560,0.08721777465608384
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,4096,2560,0.11911466386583115
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,4096,1024,0.018561777141359117
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,4096,2048,0.07188266515731812
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,4096,2048,0.10095644659466213
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,4096,768,0.01420177850458357
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,4096,1536,0.05791022380193075
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,4096,1536,0.08233066399892171
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,4096,512,0.012060444388124677
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,4096,1024,0.063609778881073
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,4096,1024,0.04282933473587036
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,4096,256,0.008949333594905006
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,4096,768,0.034796443250444196
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,4096,768,0.05397866831885444
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,4096,128,0.008284444610277811
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,4096,512,0.04382133483886719
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,4096,512,0.02814399864938524
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,4096,64,0.007269333634111617
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,4096,256,0.03500977820820279
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,4096,256,0.022983999715911016
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,4096,32,0.007641777396202087
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,4096,128,0.02163644466135237
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,4096,128,0.030593779351976182
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,4096,64,0.021029333273569744
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,4096,5120,0.07994844516118367
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,4096,32,0.02092444399992625
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,3584,16384,0.22873332765367296
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,4096,1536,0.02385422256257799
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,3584,51200,0.6872933175828723
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,3584,65536,0.9075351291232638
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,3584,12288,0.19240800539652506
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,3584,16384,0.5333626535203722
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,3584,10240,0.13455466429392496
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,3584,12288,0.44170488251580137
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,3584,16384,0.6735271347893609
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,3584,8192,0.11208889219495986
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,3584,12288,0.5626595815022787
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,3584,51200,1.724039077758789
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,3584,7168,0.0955137809117635
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,3584,65536,2.19174936082628
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,3584,8192,0.3518417676289876
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,3584,6144,0.0821395582622952
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,3584,7168,0.23871911896599662
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,3584,51200,2.053420384724935
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,3584,7168,0.3047555552588569
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,3584,6144,0.19640444384680855
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,3584,5120,0.06901688708199395
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,3584,6144,0.2599715656704373
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,3584,10240,0.3422533406151666
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,3584,5120,0.159861339463128
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,3584,4096,0.05554044577810499
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,3584,65536,2.6268702612982855
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,3584,5120,0.21655910544925264
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,3584,4096,0.12685155868530273
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,3584,4096,0.17638133631812203
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,3584,8192,0.2633102205064562
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,3584,3072,0.03830488853984409
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,3584,3584,0.1121893326441447
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,3584,3584,0.15674132770962185
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,3584,2560,0.03278933299912347
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,3584,2048,0.02754222187731001
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,3584,3072,0.09725066688325669
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,3584,3072,0.13759288522932264
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,3584,2560,0.08291822009616427
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,3584,2560,0.11805066797468398
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,3584,1536,0.021760000122918025
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,3584,1024,0.015997333659066092
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,3584,2048,0.09993600183063084
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,3584,1536,0.08119733466042413
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,3584,1536,0.0540284448199802
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,3584,768,0.012815111213260226
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,3584,1024,0.03975644376542833
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,3584,1024,0.06312177578608195
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,3584,512,0.010332444475756751
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,3584,768,0.054104000329971313
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,3584,256,0.007675555845101674
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,3584,512,0.04264800084961785
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,3584,512,0.026919111609458923
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,3584,128,0.006999111009968652
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,3584,256,0.02176977859603034
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,3584,256,0.034972445832358465
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,3584,3584,0.04519288738568624
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,3584,64,0.006607999818192587
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,3584,128,0.020234665936893888
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,3584,128,0.028797331783506606
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,3584,64,0.019897777173254225
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,3584,10240,0.43503377172682023
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,3584,32,0.01957066688272688
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,3584,2048,0.06692177719540067
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,3072,51200,0.5232515335083008
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,3072,65536,0.6855120129055448
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,3584,768,0.033032000064849854
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,3072,16384,0.1950275500615438
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,3584,32,0.006559999866618051
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,3072,12288,0.13047377268473306
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,3072,16384,0.48995288213094074
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,3072,10240,0.11667022440168594
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,3072,16384,0.6698533164130317
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,3072,12288,0.3709093464745416
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,3072,8192,0.09134844276640151
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,3072,12288,0.4852995342678494
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,3072,10240,0.31040533383687335
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,3072,7168,0.07750844293170504
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,3072,51200,1.6236338085598414
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,3072,65536,2.0909190707736545
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,3072,8192,0.2492764525943332
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,3072,6144,0.07439021931754218
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,3072,10240,0.4126533402336969
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,3072,8192,0.33099733458624947
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,3072,5120,0.05954844421810574
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,3072,7168,0.21869156095716688
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,3072,7168,0.2896408769819471
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,3072,4096,0.04506311151716444
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,3072,6144,0.18510044945610893
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,3072,6144,0.24666221936543783
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,3072,3584,0.040227555566363864
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,3072,5120,0.15239200327131483
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,3072,5120,0.20603111055162218
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,3072,3072,0.03411644366052415
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,3072,4096,0.12038311693403457
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,3072,2560,0.02879200047916836
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,3072,65536,2.4806560940212674
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,3072,3584,0.10667288965649074
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,3072,51200,1.9499030643039281
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,3072,3072,0.09335288736555312
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,3072,2048,0.02546399997340308
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,3072,1536,0.02027555637889438
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,3072,2560,0.07897955841488309
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,3072,2560,0.11274400022294785
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,3072,2048,0.06427022483613756
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,3072,2048,0.09497955772611831
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,3072,1536,0.0496782230006324
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,3072,1536,0.07788355482949151
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,3072,768,0.01204355557759603
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,3072,1024,0.06060355239444309
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,3072,1024,0.03831911087036133
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,3072,512,0.010031999813185798
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,3072,768,0.03121244576242235
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,3072,768,0.05089955528577169
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,3072,256,0.007253333098358578
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,3072,512,0.025535111625989277
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,3072,128,0.006694222076071634
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,3072,256,0.032799998919169106
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,3072,128,0.01920711166328854
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,3072,4096,0.1669680012596978
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,3072,128,0.02882400155067444
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,3072,64,0.006251555350091722
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,3072,32,0.006249777972698212
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,3072,3584,0.14892178111606175
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,3072,3072,0.13042488363054064
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,3072,32,0.018560889694425795
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,3072,1024,0.015635554989178974
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,2560,65536,0.62318664126926
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,3072,512,0.041413333680894636
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,3072,256,0.020584889584117465
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,2560,51200,0.4924169116550022
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,2560,16384,0.15219288402133518
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,3072,64,0.01886755559179518
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,2560,16384,0.4756933318244086
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,2560,12288,0.1246604389614529
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,2560,16384,0.6019946734110514
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,2560,12288,0.3508231110042996
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,2560,10240,0.10701066917843288
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,2560,65536,1.8687733544243708
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,2560,12288,0.45819732877943253
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,2560,8192,0.08568000131183201
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,2560,51200,1.4800764719645183
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,2560,10240,0.29452265633477104
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,2560,7168,0.07280977567036946
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,2560,10240,0.3848915629916721
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,2560,8192,0.23678665690951875
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,2560,6144,0.06389600038528442
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,2560,8192,0.3121182123819987
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,2560,7168,0.20607022444407144
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,2560,5120,0.05549955699178907
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,2560,7168,0.27373067537943524
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,2560,6144,0.17546044455634224
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,2560,51200,1.829437255859375
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,2560,6144,0.2329111099243164
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,2560,4096,0.03955644369125366
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,2560,5120,0.14305688275231257
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,2560,3584,0.03494755427042643
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,2560,5120,0.1938542260064019
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,2560,3072,0.028352889749738906
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,2560,4096,0.1143075492646959
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,2560,2560,0.024146666129430134
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,2560,3584,0.1001360019048055
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,2560,4096,0.15806933244069418
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,2560,3584,0.14073333475324842
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,2560,2048,0.02141422198878394
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,2560,3072,0.08697599834865993
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,2560,1536,0.016696888539526198
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,2560,3072,0.12347911463843451
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,2560,2560,0.07392711109585233
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,2560,2560,0.10616088575787014
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,2560,1024,0.012480888929631976
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,2560,2048,0.09002133210500081
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,2560,768,0.010019555687904358
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,2560,1536,0.07363555828730266
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,2560,1536,0.04788355694876777
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,2560,512,0.00831822223133511
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,2560,1024,0.03594933284653558
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,2560,768,0.04751911097102695
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,2560,768,0.029115554359224107
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,2560,512,0.02408444384733836
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,2560,512,0.04066844450102912
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,2560,128,0.005922666854328579
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,2560,256,0.03263377812173631
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,2560,256,0.019552888141738046
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,2560,64,0.005535999933878581
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,2560,32,0.005560889012283749
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,2560,128,0.017875555488798354
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,2560,128,0.02769777841038174
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,2560,64,0.017850667238235474
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,2560,32,0.01774488886197408
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,2560,65536,2.338528103298611
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,2048,65536,0.5128782060411241
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,2048,51200,0.3838515546586778
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,2048,16384,0.1260346704059177
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,2560,2048,0.06160000297758314
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,2560,1024,0.05645689037111071
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,2560,256,0.00684799998998642
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,2048,12288,0.09640977780024211
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,2048,16384,0.45375908745659727
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,2048,12288,0.3312906689114041
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,2048,10240,0.07845599783791436
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,2048,16384,0.5994497934977213
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,2048,8192,0.06594933403862847
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,2048,12288,0.4548853238423665
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,2048,51200,1.3683599895901148
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,2048,10240,0.27823734283447266
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,2048,7168,0.054535110791524254
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,2048,65536,1.7473138173421223
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,2048,10240,0.38597689734564883
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,2048,8192,0.22252888149685332
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,2048,6144,0.04648355642954508
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,2048,8192,0.31030310524834526
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,2048,5120,0.04172888729307386
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,2048,7168,0.19581866264343262
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,2048,7168,0.2718675666385227
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,2048,4096,0.03155644403563605
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,2048,6144,0.1650986671447754
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,2048,6144,0.23208888371785483
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,2048,3584,0.030065778228971694
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,2048,5120,0.13548621866438124
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,2048,5120,0.19321689340803358
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,2048,3072,0.024578667349285547
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,2048,4096,0.10732266638014053
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,2048,4096,0.15636266602410212
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,2048,2560,0.021799999806616042
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,2048,3584,0.09449866745207046
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,2048,3584,0.13918044832017687
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,2048,3072,0.08284355534447564
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,2048,3072,0.12248355812496609
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,2048,51200,1.8236079745822484
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,2048,65536,2.325484381781684
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,2048,2560,0.07077155510584514
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,2048,1536,0.013501333693663279
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,2048,2560,0.10559555557039048
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,2048,1024,0.010404444403118556
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,2048,2048,0.057320886188083224
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,2048,2048,0.08957778082953559
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,2048,768,0.008642666869693333
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,2048,1536,0.04531200064553154
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,2048,1536,0.07300000058280097
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,2048,1024,0.03298577666282654
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,2048,768,0.0277528895272149
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,2048,256,0.006050666587220297
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,2048,512,0.022703111171722412
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,2048,512,0.03878755701912774
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,2048,128,0.005208888815508948
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,2048,256,0.031574222776624895
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,2048,256,0.018246221873495314
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,2048,64,0.004927999857399198
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,2048,128,0.017066667477289837
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,2048,32,0.005212444398138259
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,2048,128,0.026896889011065166
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,2048,64,0.01648888819747501
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,2048,32,0.01648355523745219
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,2048,2048,0.018565333551830716
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,1536,65536,0.37110577689276797
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,1536,51200,0.2818151050143772
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,2048,1024,0.054921779367658824
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,2048,768,0.046910223033693105
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,1536,16384,0.09459377659691705
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,1536,16384,0.4132675594753689
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,1536,12288,0.0708106689982944
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,1536,16384,0.5630995432535807
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,1536,65536,1.63390933142768
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,1536,12288,0.3138622177971734
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,1536,10240,0.05963200330734253
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,2048,512,0.0069226668112807805
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,1536,12288,0.4281040032704671
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,1536,8192,0.051273776425255664
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,1536,7168,0.04552177919281853
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,1536,10240,0.2637857860989041
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,1536,10240,0.3601840072207981
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,1536,8192,0.21126933892567953
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,1536,6144,0.03809600075085958
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,1536,8192,0.2925706704457601
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,1536,7168,0.18508622381422254
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,1536,65536,2.1805786556667752
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,1536,5120,0.030271109607484605
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,1536,7168,0.2558808856540256
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,1536,4096,0.024775111012988623
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,1536,51200,1.7139768600463867
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,1536,6144,0.15636711650424534
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,1536,3584,0.02295644415749444
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,1536,6144,0.2185831069946289
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,1536,5120,0.1276844475004408
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,1536,3072,0.02068088948726654
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,1536,5120,0.18105599615308973
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,1536,4096,0.10162933005226983
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,1536,2560,0.017785777648289997
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,1536,3584,0.13089956177605525
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,1536,2048,0.014811555544535318
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,1536,3072,0.07823555337058173
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,1536,2560,0.06644888718922932
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,1536,2560,0.09968266884485881
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,1536,1536,0.012207110722859701
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,1536,2048,0.05464355481995476
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,1536,2048,0.08501155508889092
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,1536,1024,0.00963644435008367
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,1536,1536,0.04242488741874695
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,1536,1536,0.06864088773727417
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,1536,768,0.008634666601816813
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,1536,1024,0.03120888935195075
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,1536,1024,0.051890667941835195
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,1536,512,0.006908444480763541
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,1536,768,0.026314665873845417
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,1536,256,0.005561777700980504
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,1536,512,0.021486222743988037
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,1536,512,0.037335998482174344
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,1536,128,0.004795555439260271
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,1536,256,0.01723288827472263
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,1536,256,0.030142221185896132
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,1536,64,0.004553777890072929
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,1536,128,0.015815999772813585
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,1536,128,0.025861332813898723
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,1536,32,0.004589333302444882
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,1536,64,0.015463110473420886
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,1536,4096,0.1470479965209961
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,1536,32,0.015126221709781222
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,1536,3584,0.08997778097788493
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,1024,65536,0.2604160043928358
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,1536,51200,1.288317362467448
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,1024,51200,0.19969599776797822
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,1024,16384,0.07142221927642822
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,1536,768,0.04471022221777174
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,1024,16384,0.39687111642625594
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,1024,12288,0.04892444279458788
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,1024,16384,0.5588906606038412
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,1024,12288,0.29331199328104657
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,1024,51200,1.1807173622979057
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,1536,3072,0.1148880057864719
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,1024,65536,1.5032978057861328
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,1024,8192,0.03163999981350369
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,1024,10240,0.24428534507751465
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,1024,12288,0.425272888607449
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,1024,10240,0.3582924471961127
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,1024,8192,0.19650844732920328
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,1024,51200,1.6999279657999675
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,1024,6144,0.02513866623242696
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,1024,8192,0.29062043295966256
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,1024,7168,0.1716817749871148
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,1024,5120,0.02258577777279748
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,1024,7168,0.25410487916734487
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,1024,65536,2.169595506456163
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,1024,6144,0.14596711264716253
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,1024,4096,0.018295110927687753
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,1024,6144,0.21771910455491808
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,1024,5120,0.11851555771297878
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,1024,5120,0.18018221855163574
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,1024,4096,0.09350399838553534
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,1024,4096,0.14591466055976018
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,1024,3072,0.014642667439248828
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,1024,3584,0.08222488562266032
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,1024,3584,0.13053422504001194
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,1024,2560,0.01241422196229299
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,1024,3072,0.07153155406316121
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,1024,3072,0.11471911271413167
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,1024,2048,0.011055111057228513
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,1024,2560,0.09881689151128133
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,1024,1536,0.008752000000741746
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,1024,2048,0.08366844389173721
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,1024,2048,0.049545778168572314
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,1024,7168,0.029612445169025
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,1024,1536,0.0380968881977929
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,1024,1536,0.06815644767549303
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,1024,768,0.006245333287451003
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,1024,1024,0.028833776712417603
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,1024,1024,0.051346666283077665
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,1024,768,0.02405511173937056
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,1024,512,0.005504888792832692
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,1024,768,0.04481155673662821
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,1024,256,0.004572444491916233
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,1024,512,0.03679200013478597
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,1024,3584,0.016231111354298063
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,1024,256,0.029470221863852605
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,1024,128,0.003912888881233004
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,1024,64,0.003859555555714501
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,1024,10240,0.04171644316779243
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,1024,128,0.02541422181659275
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,1024,32,0.003942222230964237
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,1024,64,0.01443822185198466
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,1024,32,0.014137778017255994
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,768,65536,0.19924978415171304
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,1024,2560,0.06045689185460409
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,768,51200,0.15791911549038357
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,1024,1024,0.006912888752089606
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,768,16384,0.05161955621507433
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,768,16384,0.3726782268948025
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,1024,512,0.01994755533006456
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,1024,256,0.016176000237464905
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,768,12288,0.03974755605061849
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,1024,128,0.014768888552983602
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,768,10240,0.03301066822475857
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,768,12288,0.28244177500406903
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,768,51200,1.1399715211656358
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,768,65536,1.4527004030015733
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,768,8192,0.026526222626368206
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,768,12288,0.398310210969713
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,768,10240,0.23669245507982042
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,768,7168,0.02258311046494378
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,768,8192,0.19086133109198677
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,768,10240,0.33481423060099286
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,768,8192,0.27225510279337567
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,768,6144,0.019703111714786954
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,768,7168,0.16631910536024305
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,768,7168,0.23873154322306314
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,768,5120,0.017083555459976196
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,768,4096,0.014416888356208801
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,768,51200,1.5925910737779405
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,768,6144,0.140721771452162
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,768,5120,0.11429156197441949
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,768,6144,0.2029199997584025
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,768,3584,0.013057777451144325
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,768,5120,0.16854222615559897
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,768,4096,0.09042755762736003
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,768,65536,2.0256498124864364
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,768,3072,0.011715555356608497
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,768,2560,0.01038044442733129
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,768,4096,0.13716444704267713
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,768,3584,0.08024711079067655
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,768,3584,0.12178222338358562
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,768,3072,0.06969866487714979
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,768,2048,0.009017777939637503
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,768,2560,0.0581644442346361
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,768,1536,0.007575111256705389
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,768,2560,0.09233333004845513
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,768,1024,0.006498666687144174
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,768,2048,0.07822755310270521
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,768,1536,0.06418933471043904
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,768,1536,0.03636622097757127
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,768,768,0.005551110953092575
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,768,1024,0.028138667345046997
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,768,16384,0.524504025777181
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,768,1024,0.048603554566701256
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,768,512,0.004872000051869286
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,768,256,0.0041884444653987885
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,768,768,0.023341332872708637
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,768,512,0.01955911186006334
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,768,128,0.0038444445365005066
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,768,256,0.02847911251915826
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,768,256,0.015478221906556023
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,768,64,0.0035777779089079965
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,768,128,0.024362666739357844
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,768,128,0.014104889498816596
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,768,32,0.0035031110876136353
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,768,64,0.013754666679435305
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,768,32,0.013468444347381592
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,512,65536,0.16381866402096218
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,512,51200,0.1254782279332479
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,768,3072,0.10754044188393487
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,768,2048,0.04720977942148844
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,512,16384,0.04168355464935303
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,768,768,0.041610668102900185
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,768,512,0.0350835555129581
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,512,12288,0.03261155552334256
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,512,16384,0.3613484435611301
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,512,10240,0.02532888948917389
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,512,12288,0.27419643931918675
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,512,16384,0.5221164491441515
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,512,65536,1.4069218105740016
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,512,51200,1.1140320036146376
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,512,8192,0.01999288962946998
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,512,10240,0.23010489675733778
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,512,12288,0.39668620957268613
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,512,8192,0.18496621979607475
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,512,10240,0.33400623003641766
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,512,6144,0.016141333513789706
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,512,8192,0.27170221010843915
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,512,5120,0.014127110441525778
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,512,7168,0.23768533600701225
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,512,51200,1.5815288755628798
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,512,6144,0.13682133621639675
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,512,4096,0.011924444801277585
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,512,6144,0.20293866263495552
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,512,5120,0.11125777827368842
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,512,65536,2.0209742652045355
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,512,3584,0.010857777463065254
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,512,5120,0.16786577966478136
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,512,3072,0.010042666561073726
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,512,4096,0.08715199761920506
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,512,4096,0.1368186606301202
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,512,2560,0.01034222212102678
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,512,3584,0.0772248903910319
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,512,3584,0.12184533807966445
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,512,3072,0.10720800028906928
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,512,2048,0.009002666506502364
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,512,1536,0.007650666766696506
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,512,2560,0.056464003192053906
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,512,2560,0.09229777918921576
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,512,1024,0.006236444330877728
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,512,2048,0.04555999901559618
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,512,2048,0.07818844583299425
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,512,1536,0.03489866521623399
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,512,768,0.0052639999323421055
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,512,1536,0.062215997113121875
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,512,7168,0.018059555027219985
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,512,512,0.004515555583768421
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,512,1024,0.04796977837880453
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,512,768,0.041744887828826904
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,512,768,0.022664000590642292
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,512,512,0.034677333301968045
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,512,128,0.003636444608370463
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,512,7168,0.16154311762915716
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,512,128,0.01348000019788742
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,512,128,0.02444177700413598
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,512,64,0.013453333742088742
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,512,32,0.0033662221911880705
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,512,3072,0.06731644603941175
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,512,32,0.01310400002532535
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,256,65536,0.10462311241361831
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,512,1024,0.02699022160636054
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,512,256,0.0041848888827694785
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,256,51200,0.08307644393708971
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,512,512,0.018906666172875296
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,256,16384,0.03249511122703552
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,512,256,0.014848889576064216
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,512,64,0.003510222252872255
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,256,12288,0.023901333411534626
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,256,16384,0.3497600025600857
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,256,16384,0.5173884497748481
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,256,12288,0.2661191092597114
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,256,10240,0.021007110675175984
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,256,65536,1.3632870780097113
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,256,51200,1.0677813424004448
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,256,10240,0.22353243827819824
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,256,12288,0.3934408823649089
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,256,10240,0.33080267906188965
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,512,256,0.02779200010829502
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,256,7168,0.01479555500878228
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,256,8192,0.17984978357950845
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,256,6144,0.013691555294725629
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,256,8192,0.2689022223154704
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,256,51200,1.567850642734104
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,256,65536,1.9976505703396266
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,256,5120,0.011505777637163797
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,256,7168,0.2364284462398953
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,256,6144,0.13244356049431696
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,256,4096,0.008647110727098253
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,256,6144,0.2010248899459839
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,256,3584,0.00795999997191959
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,256,5120,0.10787733395894368
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,256,5120,0.16676089498731825
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,256,4096,0.0844951139556037
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,256,3072,0.007271111011505127
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,256,4096,0.13522666030459934
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,256,2560,0.006620444357395172
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,256,3584,0.07429333527882893
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,256,3584,0.12071643935309516
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,256,3072,0.06498399708006117
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,256,3072,0.10572266578674316
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,256,2048,0.005902222047249476
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,256,2560,0.0540960000620948
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,256,1536,0.004981333182917701
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,256,8192,0.017503110898865592
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,256,2560,0.09104800224304199
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,256,1024,0.0045422220395671
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,256,2048,0.07772622505823772
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,256,1536,0.06146933635075887
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,256,768,0.0041573333243529005
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,256,1536,0.03382844395107693
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,256,512,0.00388355553150177
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,256,1024,0.047351999415291675
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,256,1024,0.026102221674389307
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,256,256,0.0035173334181308746
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,256,768,0.040779554181628756
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,256,768,0.022058667408095464
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,256,128,0.003378666730390655
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,256,512,0.034056001239352755
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,256,256,0.02752799954679277
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,256,256,0.01443822185198466
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,256,64,0.00286311118139161
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,256,7168,0.1570542256037394
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,256,32,0.0031537777847713898
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,256,128,0.013078221844302284
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,128,65536,0.06934755378299289
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,256,64,0.012626666989591388
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,256,32,0.012431999875439538
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,128,51200,0.05457244316736857
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,128,16384,0.018586667047606576
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,256,2048,0.043856001562542386
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,256,512,0.018565333551830716
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,128,16384,0.34042755762736004
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,128,12288,0.01479466590616438
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,256,128,0.02330133318901062
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,128,51200,1.0374249352349174
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,128,10240,0.013198222551080914
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,128,16384,0.5163048638237847
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,128,65536,1.324586656358507
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,128,8192,0.011947555674446953
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,128,12288,0.25832443767123753
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,128,7168,0.011363555159833698
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,128,10240,0.2169919941160414
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,128,12288,0.3919235600365533
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,128,8192,0.17482844988505045
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,128,10240,0.33088000615437824
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,128,51200,1.5625129275851781
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,128,8192,0.26835110452440053
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,128,7168,0.15278400315178767
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,128,7168,0.23504887686835396
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,128,6144,0.12877866956922743
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,128,4096,0.008681777450773451
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,128,6144,0.20081778367360434
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,128,5120,0.1046924458609687
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,128,65536,1.995497809516059
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,128,3584,0.008058666355080074
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,128,5120,0.1663422187169393
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,128,3072,0.007259555160999298
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,128,4096,0.08180622259775798
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,128,4096,0.13462755415174696
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,128,3584,0.07237688700358073
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,128,2560,0.0069102222720781965
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,128,3584,0.1202204492357042
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,128,3072,0.06286488638983832
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,128,2048,0.005558222118351195
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,128,3072,0.1049777799182468
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,128,1536,0.004862222406599256
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,128,2560,0.05198488963974846
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,128,1024,0.0041724443435668945
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,128,2560,0.09076888693703546
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,128,2048,0.07561688952975802
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,128,2048,0.04244800077544319
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,128,1536,0.06198133362664116
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,128,1536,0.03324888812171088
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,128,768,0.0038897775941424896
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,128,512,0.0035439998739295532
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,128,1024,0.025412445267041523
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,128,1024,0.04758222235573662
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,128,768,0.02161066730817159
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,128,256,0.00349866681628757
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,128,512,0.017625777257813346
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,128,512,0.033801777495278254
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,128,128,0.0028764444092909494
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,128,6144,0.011329777538776398
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,128,256,0.02739199995994568
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,128,256,0.014114666316244336
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,128,32,0.0028862222615215513
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,128,128,0.01241422196229299
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,128,5120,0.009696889254781935
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,128,64,0.012256888879670037
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,64,65536,0.06315733326805963
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,128,32,0.012065778175989786
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,64,51200,0.05099822084108988
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,64,16384,0.014888000157144336
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,64,12288,0.011752888560295105
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,64,16384,0.3402720027499729
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,64,12288,0.2584471172756619
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,64,10240,0.010729778144094678
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,64,8192,0.009711110757456886
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,64,10240,0.2168977790408664
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,128,768,0.04072177741262648
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,64,8192,0.17451111475626627
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,64,7168,0.00942666663063897
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,64,6144,0.008965333302815756
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,64,5120,0.008323555191357931
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,128,64,0.0028524444335036804
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,64,51200,1.037011570400662
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,64,4096,0.007624000310897827
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2816,128,128,0.02308888898955451
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,64,7168,0.15267111195458308
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,64,3072,0.00657155571712388
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,64,5120,0.10382311211691962
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,64,65536,1.3259155485365126
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,64,2560,0.0058986664646201665
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,64,4096,0.08169600036409166
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,64,2048,0.005246222019195557
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,64,3584,0.07150933477613661
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,64,1536,0.004912000149488449
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,64,3072,0.062205334504445396
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,64,1024,0.004182222402758068
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,64,768,0.0038453332251972626
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,64,2560,0.05215555429458618
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,64,2048,0.04084711273511251
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,64,256,0.003208000005947219
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,64,1024,0.025363556212849084
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,64,768,0.021543999512990315
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,64,128,0.0028773333049482773
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,64,512,0.017838221457269456
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,64,64,0.0028239999794297745
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,64,256,0.013814222481515674
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,64,32,0.00299822228650252
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,64,128,0.012427555190192329
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,32,65536,0.06640177965164185
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,64,64,0.012063999970753988
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,64,32,0.011719110939237805
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,32,51200,0.05265511075655619
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,32,16384,0.013008889224794177
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,32,12288,0.010710222025712332
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,32,16384,0.3404097821977403
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,64,6144,0.1286275519265069
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,32,12288,0.25809423128763836
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,32,10240,0.009663110805882348
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,32,8192,0.008671999805503422
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,32,7168,0.008385777473449707
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,32,10240,0.21669956048329672
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,32,8192,0.17436622248755562
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,64,512,0.0035297779573334586
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,32,6144,0.008000888758235509
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,32,7168,0.1523324383629693
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,64,1536,0.032241778241263494
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,32,4096,0.007975999679830339
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,32,3584,0.007291555404663086
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,32,51200,1.03693421681722
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,32,6144,0.12849777274661595
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,32,5120,0.10383111238479614
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,32,3072,0.0069208890199661255
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,32,4096,0.08130488793055217
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,32,2560,0.006630222416586346
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,32,2048,0.00526577772365676
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,32,3584,0.07201955715815227
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,32,1536,0.0046951112647851305
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,32,65536,1.326314714219835
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,32,1024,0.0038542221817705366
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,32,768,0.0038284444146686127
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,32,3072,0.062479999330308705
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,32,2048,0.0421324438518948
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,32,1536,0.03269866771168179
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,32,1024,0.025418667329682246
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,32,256,0.003162666741344664
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,32,768,0.02121155626244015
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,32,128,0.0028026666906144884
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,32,512,0.01790577835506863
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,32,64,0.00254133323000537
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,32,256,0.013765333427323235
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,64,3584,0.007281777759393056
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,32,32,0.0028311111446883944
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,32,128,0.01238844460911221
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,32,64,0.012104888757069906
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,32,32,0.011742221812407175
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,32,5120,0.007401777638329401
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2816,32,2560,0.05191822184456719
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2816,32,512,0.0034968890249729156
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,65536,12288,2.421856986151801
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,65536,10240,2.1689866383870444
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,65536,16384,3.207699457804362
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,65536,12288,2.8793777889675565
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,65536,16384,3.940773434109158
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,65536,8192,1.625083605448405
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,65536,7168,1.6281653510199652
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,65536,8192,1.8177920447455511
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,65536,10240,2.299544016520182
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,65536,7168,1.5491857528686523
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,65536,6144,1.4119226667616103
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,65536,5120,1.174947526719835
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,65536,5120,1.0932756000094943
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,65536,4096,0.8205155796474881
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,65536,6144,1.3207520378960502
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,65536,3584,0.8040444586012098
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,65536,4096,0.8722995652092828
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,65536,2560,0.5064835548400879
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,65536,3072,0.6139715512593588
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,65536,2048,0.48598490820990664
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,65536,3072,0.8109413252936469
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,65536,2560,0.5941875775655111
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,65536,1536,0.35735556814405656
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,65536,3584,0.8795546425713433
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,65536,1024,0.2289342350429959
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,65536,2048,0.5546737776862251
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,65536,1536,0.45658312903510195
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,65536,1024,0.2754631042480469
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,65536,512,0.13476978407965765
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,65536,768,0.21716888745625815
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,65536,256,0.11166400379604763
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,65536,128,0.08421244223912557
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,65536,512,0.18897067175971138
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,65536,64,0.07902755339940389
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,65536,32,0.07270399729410808
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,65536,256,0.1643679936726888
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,65536,128,0.15469333860609266
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,65536,64,0.15921600659688315
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,65536,32,0.1619173288345337
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,65536,768,0.2063911093605889
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,65536,51200,10.579723782009548
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,51200,16384,2.556718190511068
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,51200,16384,3.183504104614258
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,51200,12288,1.9529351128472223
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,51200,12288,2.2632613711886935
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,51200,10240,1.5353590647379558
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,51200,8192,1.2660693062676323
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,51200,10240,1.8313458760579426
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,51200,8192,1.4475875430636937
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,51200,7168,1.1009492874145508
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,51200,51200,7.9380340576171875
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,51200,7168,1.2237698237101238
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,65536,51200,16.283252292209202
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,51200,6144,0.8900089263916016
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,51200,5120,0.8544480005900065
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,51200,4096,0.6893457836574979
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,51200,6144,1.0672871271769206
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,51200,5120,0.8669102456834582
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,51200,4096,0.7362000147501627
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,51200,3584,0.6122817993164062
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,51200,3072,0.48452266057332355
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,51200,2560,0.35875466134813094
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,51200,3072,0.5238409042358398
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,51200,3584,0.7472986645168729
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,51200,2048,0.34520355860392254
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,51200,1024,0.1873333321677314
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,51200,1536,0.22492800818549263
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,51200,65536,10.237336900499132
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,51200,1536,0.2962879869672987
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,51200,2048,0.3857617908053928
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,51200,768,0.12129067050086127
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,51200,2560,0.4880062209235297
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,51200,256,0.06879378027386136
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,51200,1024,0.28381866878933376
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,51200,128,0.058550225363837353
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,51200,64,0.04973511232270134
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,51200,256,0.13216533925798205
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,51200,32,0.051162666744656034
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,51200,128,0.15380177232954237
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,51200,768,0.18115199936760795
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,51200,64,0.126620438363817
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,51200,32,0.12674310472276476
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,51200,512,0.09971377584669326
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,51200,512,0.1507342259089152
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,16384,16384,0.7639617919921875
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,51200,51200,12.657951354980469
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,16384,16384,1.1766541798909504
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,16384,12288,0.6432871288723415
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,16384,51200,2.5331431494818792
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,16384,10240,0.440180434121026
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,16384,12288,0.8763430913289388
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,16384,8192,0.3801040119594998
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,16384,65536,3.301080067952474
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,16384,10240,0.7264995574951172
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,16384,7168,0.34698934025234646
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,16384,8192,0.5569741990831163
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,16384,6144,0.2922826608022054
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,16384,5120,0.24012178844875762
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,16384,7168,0.5171093410915798
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,16384,6144,0.4366790983412001
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,16384,4096,0.19503911336263022
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,16384,5120,0.36150399843851727
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,16384,3584,0.17767466439141166
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,16384,4096,0.2760053210788303
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,16384,3072,0.1508853303061591
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,16384,3584,0.24504621823628744
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,16384,51200,4.3148824903700085
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,16384,2560,0.1328159968058268
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,16384,2048,0.0985200007756551
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,16384,3072,0.2257333331637912
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,16384,1536,0.08181866672303942
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,16384,1024,0.05681688918007744
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,16384,2560,0.18336089452107748
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,16384,2048,0.1555404398176405
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,16384,768,0.04411377840571933
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,51200,65536,15.777399698893229
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,16384,512,0.03394488824738397
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,16384,1024,0.0900426639450921
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,16384,256,0.031515555249320135
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,16384,1536,0.11893599563174778
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,16384,128,0.022848889231681824
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,16384,768,0.07372799846861097
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,16384,512,0.06245333618587918
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,16384,64,0.019187556372748483
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,16384,256,0.05374044511053297
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,16384,32,0.019934222102165222
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,16384,128,0.05496266815397474
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,16384,64,0.05000266763899061
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,16384,32,0.05000444584422641
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,16384,65536,5.8337207370334205
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,12288,16384,0.6151270866394043
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,12288,16384,0.9413341946072049
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,12288,12288,0.4949670897589789
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,12288,10240,0.4359289010365804
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,12288,12288,0.6909573343065051
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,12288,8192,0.3774880038367377
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,12288,7168,0.26599645614624023
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,12288,10240,0.5748160150316026
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,12288,8192,0.5280266867743598
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,12288,51200,1.925076378716363
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,12288,6144,0.24036977026197645
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,12288,5120,0.19200444221496582
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,12288,7168,0.5063511000739204
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,12288,6144,0.33719733026292587
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,12288,5120,0.30318133036295575
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,12288,65536,2.4503182305230036
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,12288,3584,0.13861332999335393
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,12288,4096,0.23152356677585176
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,12288,3072,0.1181102196375529
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,12288,2560,0.10355644755893284
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,12288,3584,0.19559910562303331
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,12288,2048,0.0833466649055481
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,12288,1536,0.06328622500101726
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,12288,2560,0.1487191120783488
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,12288,3072,0.20523999796973336
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,12288,1024,0.046394666035970054
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,12288,768,0.03833333320087857
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,12288,1536,0.09887999958462185
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,12288,2048,0.1234862274593777
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,12288,512,0.029930667744742498
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,12288,256,0.021073778470357258
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,12288,1024,0.07471555471420288
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,12288,768,0.059402664502461754
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,12288,64,0.015480000111791821
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,12288,256,0.04327822062704298
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,12288,32,0.016145777371194627
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,12288,128,0.03860888878504435
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,12288,64,0.037348445918824934
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,12288,32,0.03843377696143256
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,12288,51200,3.448720932006836
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,12288,4096,0.16716621981726754
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,10240,16384,0.4933635393778483
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,12288,65536,4.255003611246745
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,12288,128,0.017941332525677152
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,12288,512,0.050851556989881724
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,10240,12288,0.37244176864624023
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,10240,10240,0.3043022155761719
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,10240,51200,1.563984023200141
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,10240,12288,0.6090542475382487
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,10240,8192,0.25640800264146596
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,10240,65536,2.09877692328559
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,10240,7168,0.21919022666083443
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,10240,10240,0.5685066646999782
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,10240,6144,0.21315556102328828
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,10240,8192,0.4443502161237929
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,10240,5120,0.16177954938676622
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,10240,6144,0.30390932824876576
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,10240,4096,0.1321715513865153
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,10240,3584,0.11382133430904812
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,10240,5120,0.3026008870866564
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,10240,4096,0.19931288560231528
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,10240,3072,0.09818844662772284
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,10240,3584,0.17518933614095053
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,10240,2560,0.08378666639328003
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,10240,3072,0.1528044409222073
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,10240,2048,0.06825600067774455
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,10240,16384,0.8635199864705404
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,10240,1536,0.05667022201750013
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,10240,2560,0.13105777899424234
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,10240,2048,0.10886044634713067
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,10240,1536,0.08693244722154404
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,10240,768,0.028011557128694322
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,10240,512,0.020781333247820537
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,10240,1024,0.06565066840913561
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,10240,256,0.017087111870447796
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,10240,768,0.052783999178144664
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,10240,51200,3.064503139919705
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,10240,128,0.014527999692493014
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,10240,7168,0.4193520016140408
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,10240,512,0.043453332450654775
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,10240,64,0.0123857781291008
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,10240,32,0.0125608891248703
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,10240,256,0.03656355539957682
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,10240,128,0.03803999887572394
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,10240,32,0.03253511256641812
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,10240,65536,4.0409626430935335
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,10240,1024,0.03659288750754462
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,8192,16384,0.42825955814785427
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,8192,12288,0.3549182150099013
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,10240,64,0.032976001501083374
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,8192,51200,1.526243527730306
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,8192,16384,0.7198559972974988
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,8192,65536,1.7007697423299153
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,8192,10240,0.2780337863498264
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,8192,8192,0.2194755607181125
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,8192,7168,0.18593955039978027
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,8192,12288,0.5507715543111166
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,8192,8192,0.370576885011461
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,8192,6144,0.1604479948679606
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,8192,10240,0.49602402581108945
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,8192,5120,0.13723556200663248
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,8192,7168,0.30902311537000865
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,8192,4096,0.10935288667678833
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,8192,3584,0.09425422218110825
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,8192,6144,0.2645173337724474
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,8192,3072,0.08258844746483697
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,8192,2560,0.06726133161120944
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,8192,5120,0.2199031114578247
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,8192,4096,0.17667999532487658
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,8192,2048,0.05646222167544895
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,8192,3584,0.15302577283647326
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,8192,1536,0.044365333186255566
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,8192,3072,0.13350844383239746
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,8192,1024,0.02983733349376255
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,8192,768,0.02444177700413598
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,8192,2048,0.09640089008543228
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,8192,512,0.017987555927700467
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,8192,1536,0.07629688580830891
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,8192,51200,2.649806128607856
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,8192,1024,0.05752178033192953
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,8192,256,0.015623110863897534
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,8192,768,0.046182221836513944
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,8192,128,0.013443555268976422
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,8192,64,0.01037599974208408
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,8192,512,0.03769866625467936
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,8192,32,0.011415111521879831
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,8192,128,0.029346668057971533
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,8192,256,0.030545777744717065
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,8192,64,0.02880355715751648
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,8192,32,0.02882222334543864
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,8192,65536,3.4015750885009766
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,7168,16384,0.3675999906327989
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,7168,12288,0.29266754786173504
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,7168,16384,0.6581146452162001
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,8192,2560,0.1266160011291504
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,7168,10240,0.23396089341905382
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,7168,12288,0.5099466641743978
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,7168,8192,0.18740533457862008
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,7168,7168,0.1701822280883789
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,7168,51200,1.258655971950955
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,7168,10240,0.40984710057576496
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,7168,65536,1.5034159554375544
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,7168,6144,0.14861244625515407
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,7168,8192,0.3858231173621283
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,7168,5120,0.12201778093973796
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,7168,7168,0.2927244504292806
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,7168,4096,0.09390044212341309
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,7168,3584,0.082424885696835
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,7168,6144,0.2681013213263618
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,7168,3072,0.07270666625764635
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,7168,2560,0.062881780995263
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,7168,4096,0.16571022404564753
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,7168,3584,0.1427368852827284
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,7168,3072,0.12435732947455512
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,7168,1536,0.04027022255791558
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,7168,2560,0.12183645036485459
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,7168,1024,0.027217777238951787
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,7168,2048,0.09109866619110107
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,7168,768,0.021852445271280076
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,7168,1536,0.07158133056428698
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,7168,1024,0.0543742212984297
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,7168,512,0.017093333933088515
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,7168,256,0.012716444830099741
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,7168,768,0.043121778302722506
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,7168,128,0.011121778024567498
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,7168,512,0.035996443695492215
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,7168,256,0.028713779317008123
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,7168,51200,2.3896107143825955
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,7168,64,0.010017777482668558
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,7168,32,0.010659555594126383
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,7168,128,0.026737777723206416
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,7168,64,0.026945778065257605
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,7168,32,0.026797332697444495
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,7168,5120,0.22568265597025552
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,7168,65536,3.1403609381781687
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,7168,2048,0.05242222216394213
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,6144,16384,0.29439110226101345
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,6144,12288,0.22526311874389648
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,6144,51200,0.8663946787516276
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,6144,10240,0.19015022118886313
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,6144,65536,1.1613618002997506
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,6144,16384,0.6243199772304958
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,6144,8192,0.14996800157758924
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,6144,12288,0.47079912821451825
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,6144,7168,0.13546044296688503
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,6144,10240,0.3992862171596951
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,6144,6144,0.11772710747188991
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,6144,8192,0.33806488249037003
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,6144,5120,0.10115822156270345
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,6144,4096,0.07991911305321588
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,6144,6144,0.22695199648539224
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,6144,3584,0.06833689080344306
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,6144,3072,0.05933244360817803
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,6144,3584,0.1301706631978353
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,6144,2560,0.0500222212738461
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,6144,51200,2.1398052639431424
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,6144,2048,0.043585777282714844
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,6144,2560,0.09893688890669082
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,6144,1536,0.034041778908835515
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,6144,2048,0.08296533425649007
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,6144,65536,2.66833856370714
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,6144,1536,0.06515555249320136
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,6144,768,0.02150933278931512
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,6144,7168,0.2782622178395589
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,6144,1024,0.049822221199671425
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,6144,512,0.01587377819750044
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,6144,768,0.039847999811172485
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,6144,256,0.013984888792037964
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,6144,128,0.01033688916100396
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,6144,5120,0.18836355209350586
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,6144,64,0.009007111191749573
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,6144,512,0.03256977929009332
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,6144,32,0.009013333254390294
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,6144,256,0.02641600039270189
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,6144,4096,0.14976444509294298
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,6144,128,0.025037333369255066
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,6144,64,0.02474400069978502
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,6144,32,0.024333332975705464
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,6144,3072,0.11552711327870686
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,5120,16384,0.27512889438205296
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,5120,12288,0.20998666021558973
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,5120,10240,0.18404711617363823
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,6144,1024,0.026526222626368206
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,5120,16384,0.5520835452609593
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,5120,51200,0.7885386678907605
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,5120,8192,0.13827021916707358
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,5120,12288,0.4145786762237549
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,5120,7168,0.12660888830820718
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,5120,65536,1.110838254292806
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,5120,6144,0.10357422298855251
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,5120,8192,0.27788088056776256
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,5120,10240,0.3728417820400662
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,5120,4096,0.06813510921266344
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,5120,7168,0.24290400081210664
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,5120,6144,0.2082986699210273
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,5120,3584,0.05765599674648709
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,5120,5120,0.1675084431966146
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,5120,3072,0.05041866501172384
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,5120,2560,0.04518311222394308
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,5120,4096,0.1459217733807034
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,5120,3584,0.11957421567704941
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,5120,3072,0.10441244310802883
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,5120,1536,0.029256890217463177
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,5120,2560,0.08986310826407538
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,5120,1024,0.019908444748984445
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,5120,768,0.016228444046444364
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,5120,2048,0.07698400153054132
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,5120,512,0.013173333472675748
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,5120,1536,0.05920355849795871
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,5120,1024,0.04423377911249796
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,5120,256,0.009705777797434065
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,5120,51200,1.860195583767361
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,5120,768,0.03649866580963135
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,5120,128,0.008971555365456475
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,5120,512,0.030024889442655776
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,5120,64,0.00814488861295912
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,5120,32,0.008622222476535374
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,5120,256,0.024333332975705464
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,5120,128,0.02295733326011234
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,5120,64,0.022687110635969374
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,5120,32,0.022289777795473736
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,5120,65536,2.398056877983941
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,5120,5120,0.09140621953540379
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,4096,16384,0.21278933684031168
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,4096,51200,0.5920275582207574
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,5120,2048,0.034443553951051496
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,4096,12288,0.15469511349995932
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,4096,65536,0.7888897789849175
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,4096,10240,0.1620968845155504
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,4096,16384,0.5040435791015625
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,4096,8192,0.15253510740068224
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,4096,7168,0.117122663391961
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,4096,12288,0.40284710460238987
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,4096,10240,0.34128178490532773
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,4096,6144,0.09568355480829875
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,4096,8192,0.25279198752509224
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,4096,5120,0.08159822225570679
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,4096,7168,0.23593065473768446
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,4096,4096,0.06468711296717326
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,4096,3584,0.06137688954671224
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,4096,6144,0.1913013325797187
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,4096,5120,0.1525342199537489
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,4096,3072,0.052744001150131226
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,4096,4096,0.12825955284966364
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,4096,3584,0.10834399859110515
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,4096,2048,0.0321395562754737
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,4096,3072,0.09616355763541327
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,4096,1536,0.02520888878239526
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,4096,2560,0.08228000005086263
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,4096,1024,0.018388445178667705
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,4096,51200,1.6976835462782118
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,4096,768,0.015013333823945789
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,4096,2048,0.06470844480726454
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,4096,512,0.011735999749766456
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,4096,256,0.008646222452322641
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,4096,1536,0.054437332683139376
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,4096,1024,0.04073511229621039
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,4096,128,0.007315555380450354
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,4096,768,0.03311199943224589
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,4096,512,0.02688177757793003
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,4096,64,0.006628444625271692
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,4096,32,0.006633777585294511
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,4096,256,0.022026666336589392
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,4096,65536,2.1307716369628906
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,4096,128,0.020983111527231004
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,4096,64,0.020281778441535104
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,4096,32,0.020257777637905545
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,3584,12288,0.1452702283859253
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,3584,16384,0.20237510734134248
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,3584,10240,0.12200000551011826
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,3584,51200,0.5434444215562608
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,3584,16384,0.4763813548617893
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,3584,65536,0.6815377871195475
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,4096,2560,0.03889155719015334
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,3584,8192,0.09307999743355645
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,3584,12288,0.3583769003550212
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,3584,7168,0.08898044294781154
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,3584,6144,0.07228177785873413
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,3584,10240,0.30261598692999947
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,3584,5120,0.06735644737879436
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,3584,4096,0.049916442897584706
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,3584,8192,0.24126044909159342
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,3584,7168,0.21016621589660645
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,3584,6144,0.17738844288720024
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,3584,3072,0.035107556316587664
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,3584,5120,0.15129600630866155
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,3584,4096,0.13383200433519152
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,3584,3584,0.10331555869844224
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,3584,2048,0.028748446040683325
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,3584,3072,0.09054222371843125
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,3584,1536,0.023899555206298828
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,3584,1024,0.01736000014675988
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,3584,2560,0.07871022489335802
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,3584,768,0.012950222525331708
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,3584,2048,0.06257777743869357
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,3584,1536,0.05059733324580722
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,3584,1024,0.03990133272276984
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,3584,51200,1.5823360019259984
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,3584,256,0.007300444775157505
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,3584,768,0.03195644418398539
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,3584,512,0.02571288910177019
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,3584,64,0.006695111178689533
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,3584,128,0.01962222158908844
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,3584,256,0.020936000678274367
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,3584,32,0.00664533343580034
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,3584,65536,1.9883679283989801
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,3584,64,0.019557333654827543
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,3584,32,0.019253333409627277
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,3584,3584,0.04233155647913615
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,3584,2560,0.03151911165979173
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,3072,51200,0.41642043325636124
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,3072,16384,0.15606489446428087
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,3072,65536,0.585369798872206
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,3072,12288,0.1166951126522488
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,3072,10240,0.1018506685892741
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,3584,512,0.0101724440852801
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,3072,8192,0.08408177561230129
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,3072,12288,0.3420826594034831
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,3072,7168,0.07445333401362102
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,3072,16384,0.4518417782253689
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,3072,10240,0.2892906665802002
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,3072,6144,0.0610355536142985
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,3072,8192,0.22866667641533744
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,3072,5120,0.0483439995182885
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,3072,4096,0.04023733403947618
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,3072,7168,0.220104005601671
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,3072,6144,0.16987110508812797
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,3072,3584,0.038188444243537054
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,3072,5120,0.1379564470714993
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,3072,3072,0.03352888756328159
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,3072,4096,0.11061155796051025
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,3072,2560,0.029325332906511094
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,3072,2048,0.024874667326609295
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,3072,3584,0.09911466969384088
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,3072,51200,1.4892453087700739
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,3072,1536,0.019136889113320243
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,3072,1024,0.014542222023010254
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,3072,2560,0.07220800055397882
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,3072,2048,0.06023999717500475
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,3072,1536,0.046951999266942344
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,3072,512,0.00960177762640847
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,3072,1024,0.0358933342827691
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,3072,65536,1.887692345513238
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,3072,256,0.007280000381999546
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,3072,768,0.029846221208572388
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,3072,128,0.006627555522653792
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,3072,64,0.0058808889653947614
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,3072,512,0.024442666106753882
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,3072,256,0.020032000210550096
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,3072,32,0.005945777727497949
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,3072,128,0.01886666648917728
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,3584,128,0.007291555404663086
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,3072,32,0.018220444520314533
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,2560,51200,0.4003431002298991
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,2560,65536,0.511557314130995
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,2560,16384,0.14940088325076634
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,3072,3072,0.08586488829718696
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,2560,12288,0.1072853340042962
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,3072,768,0.011968000067604912
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,2560,10240,0.07882577843136258
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,2560,16384,0.4425102339850531
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,2560,8192,0.06779644224378797
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,2560,12288,0.32328176498413086
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,2560,7168,0.06721866793102689
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,2560,10240,0.2708417839474148
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,2560,6144,0.058918224440680615
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,3072,64,0.018534221582942538
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,2560,5120,0.04456444581349691
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,2560,8192,0.22046844164530435
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,2560,4096,0.034076445632510714
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,2560,3584,0.03105955653720432
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,2560,6144,0.1594346629248725
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,2560,51200,1.357950210571289
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,2560,5120,0.1314835548400879
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,2560,3072,0.02738044493728214
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,2560,4096,0.10573066605461968
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,2560,2560,0.023000889354281958
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,2560,3584,0.09369333585103352
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,2560,2048,0.02000799940692054
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,2560,1536,0.01588711142539978
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,2560,65536,1.736403571234809
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,2560,1024,0.011600000162919363
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,2560,2560,0.07013689147101508
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,2560,768,0.009926222264766693
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,2560,2048,0.05783289008670383
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,2560,512,0.007816889219813878
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,2560,1536,0.044397334257761635
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,2560,256,0.0063288890653186375
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,2560,128,0.005930666708283954
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,2560,1024,0.033597333563698664
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,2560,768,0.027923554182052612
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,2560,512,0.02306488818592495
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,2560,64,0.005551110953092575
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,2560,256,0.01889155473974016
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,2560,32,0.00554933316177792
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,2560,128,0.01754666699303521
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,2560,64,0.01717511150572035
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,2560,32,0.016872889465755887
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,2048,16384,0.10406488842434353
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,2048,51200,0.2983484533098009
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,2048,12288,0.07943644126256307
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,2048,65536,0.38999377356635195
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,2048,10240,0.06832177771462335
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,2048,8192,0.05303200085957845
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,2560,7168,0.1888400051328871
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,2048,16384,0.39940712187025285
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,2048,7168,0.04581955406400892
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,2048,12288,0.30279111862182617
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,2048,10240,0.25361156463623047
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,2048,6144,0.03925866550869412
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,2048,5120,0.034267554680506386
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,2048,8192,0.20362044705284965
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,2560,3072,0.08128977484173246
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,2048,4096,0.03220266766018338
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,2048,7168,0.17710399627685547
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,2048,3584,0.024719999896155462
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,2048,6144,0.1514328850640191
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,2048,5120,0.12197244167327881
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,2048,2560,0.019359111785888672
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,2048,4096,0.09796444574991862
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,2048,3584,0.09013688564300537
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,2048,2048,0.01741333305835724
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,2048,3072,0.07590044207043119
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,2048,1536,0.01367288910680347
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,2048,1024,0.010224888722101847
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,2048,2560,0.06554133362240262
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,2048,51200,1.2454427083333333
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,2048,1536,0.041272888580958046
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,2048,512,0.0069422221018208405
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,2048,1024,0.031121777163611516
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,2048,256,0.005894222193294101
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,2048,768,0.026380444566408794
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,2048,65536,1.5878355238172743
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,2048,128,0.005212444398138259
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,2048,512,0.02199288871553209
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,2048,64,0.004583999928500918
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,2048,32,0.004865777575307422
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,2048,256,0.017567111386193168
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,2048,128,0.016362667083740234
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,2048,64,0.01644088824590047
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,2048,32,0.016140444411171805
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,1536,65536,0.31255555152893066
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,1536,51200,0.2598204347822401
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,1536,16384,0.08003999789555867
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,2048,3072,0.021807110971874658
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,1536,12288,0.06313600142796834
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,1536,10240,0.05116533239682516
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,2048,768,0.008575999902354347
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,1536,16384,0.3757182227240668
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,1536,12288,0.2852364381154378
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,1536,10240,0.24712710910373262
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,1536,8192,0.04008533226119147
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,1536,7168,0.03567911187807719
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,1536,6144,0.03155644403563605
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,1536,5120,0.027335999740494624
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,1536,8192,0.19169333246019152
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,1536,7168,0.16660977734459773
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,1536,4096,0.021735111872355144
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,1536,6144,0.1407359970940484
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,1536,3584,0.019687111179033916
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,1536,3072,0.017709333035680983
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,1536,4096,0.09201155768500434
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,1536,2560,0.016120889120631747
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,1536,2048,0.013079110946920184
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,1536,65536,1.4841893513997395
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,1536,3072,0.07125866413116455
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,1536,1536,0.011026666396194033
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,1536,1024,0.008638222184446123
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,1536,2560,0.060898668236202665
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,1536,2048,0.04874222146140205
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,1536,768,0.00756533361143536
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,1536,1536,0.03816533419820998
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,1536,512,0.006256000035338932
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,1536,256,0.0052560000783867305
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,1536,1024,0.02917511264483134
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,1536,128,0.004570666700601578
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,1536,768,0.02504088812404209
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,1536,512,0.020953777763578627
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,1536,64,0.004517333375083076
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,1536,32,0.004497777670621872
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,2048,2048,0.05479910969734192
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,1536,128,0.015469332536061605
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,1536,64,0.015488889482286243
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,1536,32,0.01479022204875946
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,1024,65536,0.2208497789171007
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,1024,51200,0.18344622188144258
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,1024,16384,0.06597244739532471
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,1024,12288,0.048194666703542076
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,1536,5120,0.11871377627054851
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,1024,10240,0.03750311003790961
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,1536,3584,0.08227555619345771
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,1024,8192,0.027832001447677612
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,1024,16384,0.35344799359639484
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,1024,12288,0.28080712424384224
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,1024,7168,0.024117334021462336
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,1024,6144,0.020773332979944017
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,1024,10240,0.22531467013888887
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,1024,5120,0.019630221856964957
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,1024,8192,0.18104799588521323
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,1024,4096,0.01601777805222405
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,1024,7168,0.16018133693271214
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,1024,6144,0.132259554333157
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,1024,3584,0.014415999253590902
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,1536,256,0.01683022247420417
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,1024,3072,0.013061333033773633
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,1024,5120,0.10673155387242635
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,1024,51200,1.0812959671020508
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,1024,2560,0.011415999796655444
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,1024,4096,0.08622666862275864
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,1024,2048,0.009760888914267222
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,1024,1536,0.008330666356616551
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,1024,3584,0.07699111435148451
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,1024,3072,0.06720355484220716
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,1024,65536,1.381232049730089
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,1024,2560,0.05551200111707052
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,1024,2048,0.04520710971620348
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,1024,768,0.005909333212508096
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,1024,512,0.004896000027656555
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,1024,256,0.004541333350870344
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,1024,1536,0.03588533401489258
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,1024,1024,0.027764444549878437
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,1024,128,0.003966222206751506
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,1024,768,0.023353776997990076
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,1024,512,0.019686222076416016
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,1024,32,0.003834666477309333
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,1024,256,0.015826667348543804
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,1536,51200,1.1602950625949435
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,1024,128,0.014475555883513557
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,1024,64,0.013819555441538492
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,1024,32,0.013759111364682516
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,768,65536,0.1877439949247572
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,768,51200,0.15041155285305446
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,768,16384,0.04963555600908068
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,768,12288,0.036680890454186335
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,768,10240,0.03231199913554721
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,768,12288,0.26055910852220326
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,768,16384,0.3425449000464545
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,768,8192,0.024736889534526404
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,768,10240,0.21822844611273873
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,768,7168,0.022099556194411382
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,768,6144,0.019698666201697457
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,768,8192,0.1746302180820041
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,768,5120,0.01681600014368693
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,768,6144,0.12804355886247423
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,768,4096,0.014386667145623101
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,1024,64,0.0035137778355015647
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,768,51200,1.0458692974514432
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,768,3584,0.011216888825098673
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,768,5120,0.10419466760423447
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,768,3072,0.010348444183667501
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,768,2560,0.009321778184837764
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,768,4096,0.0833466649055481
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,768,2048,0.008162666526105668
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,768,3584,0.07361421982447307
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,768,3072,0.06505688693788317
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,768,1536,0.0069191112286514705
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,768,2560,0.05386044581731161
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,768,1024,0.005596444424655702
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,768,768,0.005203555441564984
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,768,2048,0.04366933306058248
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,768,512,0.004514666481150521
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,768,1536,0.03425511055522495
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,768,256,0.004211555752489301
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,768,768,0.022635555929607813
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,768,512,0.01891377733813392
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,768,256,0.015160888433456421
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,768,64,0.003867555409669876
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,768,128,0.013809777796268463
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,768,32,0.0038906666967603895
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,768,64,0.013746666411558786
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,1024,1024,0.006643555644485686
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,768,7168,0.15202311674753824
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,768,32,0.013245333400037555
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,512,65536,0.16342222690582275
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,512,51200,0.1299333307478163
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,512,16384,0.03466399841838413
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,512,12288,0.025729777084456548
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,768,65536,1.3321190940009224
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,512,10240,0.020560888780487906
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,512,16384,0.33265601264105904
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,512,12288,0.2521955437130398
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,512,8192,0.016728889611032274
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,768,1024,0.02684088879161411
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,512,6144,0.013336000343163809
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,768,128,0.004171555654870139
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,512,5120,0.011750222080283694
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,512,7168,0.14728889200422499
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,512,4096,0.010051555931568146
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,512,6144,0.1241333352194892
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,512,51200,1.0118044747246635
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,512,3584,0.009372444616423713
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,512,3072,0.008639111287064022
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,512,5120,0.10048977533976237
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,512,2560,0.007600000335110559
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,512,4096,0.08071111308203803
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,512,65536,1.2930444081624348
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,512,2048,0.006612444503439798
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,512,3584,0.07114399804009332
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,512,1536,0.00591466658645206
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,512,3072,0.061575108104281955
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,512,2560,0.05170933405558268
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,512,2048,0.041801777150895864
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,512,768,0.004506666627195147
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,512,512,0.0041955556306574075
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,512,1024,0.02587466604179806
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,512,256,0.0035439998739295532
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,512,768,0.021758221917682227
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,512,512,0.018235555953449674
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,512,256,0.014687110980351767
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,512,64,0.003170666595300039
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,512,128,0.013407111167907715
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,512,7168,0.014764444695578681
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,512,32,0.0035093331502543557
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,512,10240,0.21118933624691436
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,512,64,0.013304000099500021
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,256,65536,0.0806515547964308
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,512,32,0.01277511070171992
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,512,8192,0.16945155461629233
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,256,51200,0.06487377484639485
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,256,16384,0.02488533324665493
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,256,12288,0.018630221486091614
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,256,16384,0.3215999868181017
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,512,1024,0.005052444421582752
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,256,12288,0.2438817818959554
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,256,10240,0.01885600056913164
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,256,8192,0.01592088904645708
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,256,7168,0.01461866663561927
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,512,1536,0.033117334047953285
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,256,6144,0.012824888858530255
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,256,8192,0.1641182237201267
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,512,128,0.0032266666077905228
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,256,5120,0.011402666568756104
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,256,7168,0.14174666669633654
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,256,4096,0.011171555353535546
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,256,51200,0.9776710934109158
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,256,6144,0.11967733171251084
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,256,3584,0.007970666719807519
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,256,3072,0.007306666837798224
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,256,2560,0.0063546668324205614
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,256,4096,0.07738933298322889
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,256,3584,0.06867822011311848
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,256,3072,0.05936888853708903
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,256,1536,0.005091555416584015
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,256,2560,0.04879200127389696
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,256,1024,0.004519111166397731
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,256,2048,0.040476444694730974
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,256,768,0.0041893331540955436
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,256,1024,0.025067556235525344
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,256,512,0.003516444315512975
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,256,768,0.02104266650146908
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,256,256,0.003478222423129611
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,256,512,0.017901332841979135
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,256,128,0.0031591111587153543
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,256,256,0.01402666668097178
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,256,64,0.003162666741344664
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,256,128,0.012729778057999082
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,256,10240,0.20461866590711805
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,256,32,0.002895999906791581
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,256,64,0.012383999923865
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,128,65536,0.06028711133533054
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,256,32,0.012472888661755456
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,128,51200,0.05052888724539015
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,128,16384,0.015499555402331881
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,256,65536,1.2469120025634766
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,128,12288,0.013066666821638743
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,256,1536,0.031896889209747314
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,128,10240,0.012050666742854647
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,128,12288,0.2367644574907091
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,128,8192,0.011018666956159802
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,128,10240,0.19889956050448945
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,128,7168,0.012303999728626676
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,128,8192,0.15875021616617838
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,128,51200,0.9467653698391385
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,128,6144,0.011930666863918304
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,128,5120,0.010438222024175854
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,128,65536,1.2111440234714084
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,128,4096,0.008664000365469191
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,128,7168,0.13777421580420599
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,128,6144,0.11593333880106609
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,128,3584,0.00793511089351442
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,256,5120,0.09697155819998847
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,128,3072,0.007305777735180325
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,128,5120,0.09354666868845622
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,128,2560,0.006253333141406377
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,128,2048,0.005566222386227713
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,256,2048,0.0058906666106647914
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,128,1536,0.004906666775544484
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,128,1024,0.004171555654870139
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,128,3072,0.05714755588107639
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,128,2560,0.04803644286261665
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,128,2048,0.038740442858801946
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,128,768,0.0038444445365005066
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,128,1536,0.030869334936141968
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,128,256,0.0032071111102898917
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,128,768,0.020602666669421725
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,128,512,0.01740622189309862
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,128,128,0.0031822222388452957
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,128,64,0.0028400001012616684
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,128,256,0.013462222284740873
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,128,32,0.002895111011134254
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,128,128,0.012402666939629449
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,128,64,0.012358222570684222
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,64,65536,0.06001955270767212
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,128,32,0.011742221812407175
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,64,51200,0.04719822274314033
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,64,16384,0.013449778159459433
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,64,16384,0.3117289013332791
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,128,4096,0.07459111346138848
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,64,12288,0.012423111332787408
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,128,3584,0.06691466437445746
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,64,10240,0.011697777443461947
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,64,8192,0.01033155537313885
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,128,512,0.0038382220599386427
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,128,16384,0.3115226692623562
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,64,12288,0.23626399040222168
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,64,6144,0.009313777916961247
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,64,51200,0.9468026691012912
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,64,8192,0.15903377532958984
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,64,5120,0.009006222089131674
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,64,7168,0.13709155718485513
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,64,4096,0.007641777396202087
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,64,65536,1.209620475769043
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,64,6144,0.11549688710106744
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,64,3584,0.007293333609898885
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,64,3072,0.006608888920810487
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,64,4096,0.07430844174491034
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,64,3584,0.06594577762815687
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,64,2560,0.0058906666106647914
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,64,2048,0.005280888742870755
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,64,3072,0.05695733096864489
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,64,1536,0.00490133340160052
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,64,2048,0.037885334756639265
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,64,2560,0.046763555871115796
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,64,1024,0.0041680000722408295
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,64,1536,0.031215111414591473
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,64,768,0.0038720000949170855
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,64,512,0.0035173334181308746
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,64,1024,0.024119110571013555
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,64,768,0.020655110478401184
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,128,1024,0.024488889508777197
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,64,128,0.002858666703104973
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,64,10240,0.19850488503774008
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,64,64,0.0028275555620590844
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,64,128,0.01240355521440506
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,64,32,0.0028657778683635923
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,64,64,0.012103111379676394
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,64,5120,0.09326577848858303
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,64,32,0.0120319997270902
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,32,65536,0.05732444259855482
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,32,51200,0.04599200023545159
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,32,16384,0.012480888929631976
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,32,16384,0.31118665801154244
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,32,12288,0.01073333372672399
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,64,256,0.003167111012670729
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,64,7168,0.010683555569913654
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,64,256,0.013528000149461957
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,32,12288,0.2364764478471544
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,32,8192,0.00902133352226681
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,32,51200,0.9463013543023003
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,32,7168,0.008612444831265343
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,32,6144,0.007989333735571967
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,32,10240,0.19844978385501436
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,32,5120,0.010915555887752108
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,32,65536,1.2088204489813912
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,32,7168,0.13698666625552708
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,32,4096,0.009008888569143083
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,32,6144,0.11566932996114095
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,32,3584,0.008622222476535374
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,32,5120,0.09330755472183228
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,32,3072,0.007984889050324758
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,32,2560,0.0069617778062820435
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,32,4096,0.07501777675416735
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,32,2048,0.005210666606823604
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,32,3584,0.06685422526465522
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,32,1536,0.004582222137186262
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,32,3072,0.05681688918007744
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,32,1024,0.003906666818592283
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,32,2560,0.04661600126160515
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,32,768,0.0038577777643998465
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,32,512,0.0034871109657817413
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,32,2048,0.037780443827311196
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,32,256,0.002982222164670626
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,32,1024,0.024280889166726008
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,32,768,0.020623111062579684
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,32,128,0.002893333426780171
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,32,512,0.01720355616675483
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,32,64,0.00282222218811512
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,32,32,0.00282222218811512
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,32,256,0.013752889302041797
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,64,512,0.017186666528383892
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,32,128,0.012100444071822695
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,32,64,0.011765333513418833
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,32,32,0.011722666521867117
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,32,8192,0.1585351096259223
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2561,32,1536,0.031193776263131037
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2561,32,10240,0.009813333551088968
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,65536,16384,3.2725599077012806
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,65536,12288,2.436994764539931
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,65536,16384,3.8362282647026906
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,65536,12288,2.7660196092393665
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,65536,10240,2.038092507256402
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,65536,16384,3.434456083509657
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,65536,10240,2.227368884616428
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,65536,8192,1.6366035673353407
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,65536,12288,2.6372256808810763
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,65536,10240,2.134245342678494
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,65536,8192,1.7558879852294922
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,65536,7168,1.4207866456773546
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,65536,6144,1.2825440300835502
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,65536,8192,1.7557946311102972
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,65536,7168,1.5569368998209636
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,65536,7168,1.4732177522447374
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,65536,5120,0.9423893822564019
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,65536,5120,1.0679066975911458
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,65536,6144,1.3110969331529405
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,65536,51200,10.694556342230904
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,65536,4096,0.772156450483534
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,65536,6144,1.2657040490044487
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,65536,3584,0.7296320067511665
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,65536,4096,0.8449128998650445
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,65536,5120,1.0236177444458008
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,65536,4096,0.8643004629347059
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,65536,3584,0.7648888693915473
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,65536,3072,0.5616515477498373
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,65536,3072,0.696787569257948
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,65536,2560,0.43432799975077313
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,65536,2560,0.6713555653889974
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,65536,2048,0.3949440055423313
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,65536,3072,0.6316337585449219
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,65536,3584,0.7114622328016492
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,65536,2560,0.5269191000196669
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,65536,2048,0.45358578364054364
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,65536,1536,0.31258667839898
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,65536,1536,0.3703555530971951
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,65536,1024,0.20298400190141466
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,65536,2048,0.4462569024827745
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,65536,768,0.1607795556386312
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,65536,1024,0.315757327609592
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,65536,1536,0.3605662186940511
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,65536,1024,0.26244089338514537
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,65536,512,0.12272532780965169
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,65536,256,0.08678578005896674
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,65536,768,0.214775111940172
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,65536,768,0.23285778363545737
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,65536,512,0.18501688374413383
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,65536,512,0.17643733819325766
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,65536,128,0.073161780834198
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,65536,64,0.06759555472267999
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,65536,256,0.13875555992126465
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,65536,256,0.1645875506930881
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,65536,128,0.10884444581137763
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,65536,32,0.06781244277954102
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,65536,128,0.1536924441655477
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,65536,64,0.1557395590676202
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,65536,32,0.15573067135281032
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,65536,51200,15.664752536349825
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,65536,51200,11.56592983669705
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,51200,16384,2.503941429985894
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,51200,16384,3.0892185635036893
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,51200,12288,2.0093154907226562
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,51200,16384,2.731230205959744
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,51200,51200,8.047617594401041
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,51200,10240,1.5385253694322374
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,51200,65536,10.106207105848524
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,51200,12288,2.1915565066867404
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,51200,12288,2.0379511515299478
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,51200,8192,1.4260124630398219
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,51200,10240,1.7975298563639324
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,51200,51200,12.38105689154731
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,51200,8192,1.4110266367594402
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,51200,10240,1.6437973446316188
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,51200,7168,1.1670470767550998
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,51200,51200,9.231319003634983
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,51200,7168,1.225187513563368
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,51200,8192,1.3411724302503798
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,51200,6144,1.077681753370497
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,51200,6144,1.0698764589097765
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,51200,5120,0.7781706915961372
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,51200,7168,1.1794204711914062
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,51200,5120,0.8861235512627496
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,51200,4096,0.6289813253614638
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,51200,65536,15.327753702799479
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,51200,4096,0.7185333569844564
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,51200,6144,0.9617155922783746
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,51200,5120,0.8064906862046984
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,51200,3584,0.5537581973605686
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,51200,3584,0.6765404277377658
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,51200,4096,0.654647085401747
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,51200,3072,0.4491288926866319
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,51200,3072,0.5441386434766982
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,51200,2560,0.4779991043938531
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,51200,3584,0.584021356370714
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,51200,2048,0.32085778978135854
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,51200,2560,0.4426862133873834
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,51200,3072,0.5149955749511719
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,51200,1536,0.2362284395429823
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,51200,2048,0.36259110768636066
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,51200,2560,0.44085245662265354
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,51200,1536,0.30642578336927623
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,51200,2048,0.3648106786939833
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,51200,768,0.15686933199564615
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,51200,1536,0.28374044100443524
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,51200,1024,0.21679111321767172
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,51200,512,0.12402666939629449
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,51200,768,0.1823528872595893
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,51200,512,0.14711466100480822
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,51200,512,0.146323561668396
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,51200,768,0.1743697722752889
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,51200,65536,11.866863674587675
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,51200,128,0.05576622486114502
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,51200,64,0.0469395551416609
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,51200,256,0.11389956209394668
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,51200,256,0.12913155555725098
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,51200,128,0.12205866972605388
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,51200,64,0.12335822317335342
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,51200,128,0.11910933918423122
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,51200,32,0.12336533599429661
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,51200,1024,0.1604213317235311
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,51200,1024,0.2628355556064182
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,51200,256,0.10228355725606282
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,51200,32,0.06251821915308635
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,16384,16384,0.82714753680759
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,16384,51200,2.6454444461398654
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,16384,65536,3.301816940307617
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,16384,16384,1.162025769551595
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,16384,12288,0.6427431106567383
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,16384,12288,0.828128867679172
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,16384,10240,0.49805688858032227
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,16384,16384,1.1257190704345703
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,16384,51200,4.058264838324653
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,16384,8192,0.40881776809692383
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,16384,10240,0.6960719956292046
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,16384,12288,0.8417546484205457
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,16384,65536,5.4260143703884545
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,16384,7168,0.34548089239332413
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,16384,10240,0.719687991672092
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,16384,6144,0.28804177708095974
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,16384,51200,3.672107696533203
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,16384,7168,0.5157795482211643
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,16384,8192,0.6280426449245876
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,16384,6144,0.410866657892863
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,16384,5120,0.24538400438096789
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,16384,7168,0.5083804660373265
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,16384,4096,0.19631644090016684
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,16384,5120,0.33885600831773544
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,16384,3584,0.16785955429077148
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,16384,5120,0.3640684551662869
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,16384,4096,0.29413244459364146
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,16384,65536,4.716375986735026
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,16384,8192,0.5473795466952854
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,16384,3072,0.15397689077589247
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,16384,4096,0.2931404378679064
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,16384,3584,0.23563199573092988
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,16384,2560,0.12318489286634658
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,16384,3072,0.21693778038024902
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,16384,2560,0.17648888958825004
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,16384,3072,0.24880711237589517
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,16384,2560,0.19468266434139678
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,16384,1536,0.07611199882295397
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,16384,2048,0.16649866104125977
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,16384,1024,0.0532497763633728
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,16384,1536,0.13235199451446533
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,16384,768,0.04259022076924642
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,16384,1024,0.10262044270833333
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,16384,1024,0.09010044733683269
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,16384,512,0.033424887392256
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,16384,768,0.0712675584687127
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,16384,768,0.08625155687332153
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,16384,256,0.024241778585645888
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,16384,6144,0.44243465529547793
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,16384,512,0.06072000000211927
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,16384,512,0.07224355803595649
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,16384,128,0.022243556049134996
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,16384,256,0.056559999783833824
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,16384,256,0.0520666672123803
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,16384,64,0.019152889649073284
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,16384,128,0.04907822277810839
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,16384,32,0.01969688965214623
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,16384,2048,0.10114488999048869
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,16384,3584,0.2733999888102214
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,16384,64,0.04889511068662008
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,16384,32,0.04909333255555895
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,16384,2048,0.14556622505187988
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,16384,1536,0.11836000283559163
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,16384,128,0.04629688792758518
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,12288,51200,2.1456097496880426
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,12288,16384,0.9269190894232856
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,12288,16384,0.6865217950608996
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,12288,65536,2.659242630004883
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,12288,12288,0.48626311620076496
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,12288,10240,0.37032177713182235
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,12288,12288,0.678783999549018
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,12288,51200,3.3743368784586587
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,12288,16384,0.9372871186998156
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,12288,12288,0.7154186566670736
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,12288,10240,0.6162968741522895
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,12288,8192,0.31192445755004883
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,12288,8192,0.4580835766262478
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,12288,10240,0.5935884581671821
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,12288,65536,4.255936092800565
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,12288,51200,3.013198216756185
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,12288,6144,0.24094756444295248
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,12288,8192,0.4805706871880426
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,12288,7168,0.4534622298346625
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,12288,5120,0.20014222462972006
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,12288,6144,0.34005599551730686
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,12288,7168,0.42019467883639866
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,12288,5120,0.2735688951280382
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,12288,4096,0.15760444270239934
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,12288,5120,0.30901866488986546
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,12288,3584,0.1363875601026747
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,12288,6144,0.3683937655554877
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,12288,4096,0.2206826607386271
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,12288,3072,0.11398933993445502
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,12288,4096,0.2457866668701172
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,12288,3584,0.22550400098164877
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,12288,2560,0.09360266394085354
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,12288,65536,3.8579076131184897
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,12288,3072,0.17277422216203478
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,12288,3584,0.22025867303212485
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,12288,2048,0.0802968872918023
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,12288,7168,0.2533502313825819
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,12288,3072,0.19154666529761422
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,12288,2560,0.14474311139848497
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,12288,1536,0.059119999408721924
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,12288,2560,0.17254400253295898
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,12288,1024,0.04298311140802172
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,12288,2048,0.12012710836198594
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,12288,2048,0.13942755593193903
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,12288,768,0.0314702226055993
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,12288,1536,0.11276088820563422
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,12288,1536,0.09574844439824422
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,12288,512,0.025407110651334126
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,12288,1024,0.08966133329603408
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,12288,1024,0.07616000043021308
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,12288,256,0.024904888537194993
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,12288,768,0.07446844710244073
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,12288,128,0.022273777259720698
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,12288,768,0.0591848889986674
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,12288,512,0.062237335575951465
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,12288,256,0.050682667228910655
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,12288,256,0.04136355717976888
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,12288,128,0.04064800010787116
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,12288,128,0.0376782218615214
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,12288,64,0.03691555394066705
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,12288,32,0.03674933314323425
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,12288,64,0.016819554898473952
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,12288,32,0.016905777984195285
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,10240,51200,1.7779706319173176
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,10240,65536,2.2186080084906683
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,10240,16384,0.515059577094184
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,12288,512,0.049696889188554555
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,10240,12288,0.4020453294118245
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,10240,16384,0.8498071034749349
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,10240,12288,0.5976062350802952
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,10240,10240,0.32716088824801975
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,10240,16384,0.8697608841790093
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,10240,12288,0.6620408693949381
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,10240,10240,0.4982622464497884
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,10240,8192,0.266611549589369
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,10240,65536,3.7538799709743924
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,10240,10240,0.5627982351515028
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,10240,7168,0.2374195522732205
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,10240,51200,2.957703060574002
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,10240,8192,0.3998071087731256
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,10240,6144,0.20458132690853545
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,10240,7168,0.36621512307061094
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,10240,8192,0.44135112232632107
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,10240,5120,0.1749875545501709
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,10240,6144,0.30500443776448566
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,10240,7168,0.3888346619076199
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,10240,5120,0.24630043241712782
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,10240,4096,0.14014844099680582
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,10240,65536,3.485735999213325
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,10240,3584,0.11271111170450847
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,10240,5120,0.2763982348971897
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,10240,51200,2.7413359747992625
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,10240,4096,0.19693599806891549
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,10240,3072,0.09566489193174575
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,10240,4096,0.2265040079752604
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,10240,3584,0.21099910471174452
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,10240,3584,0.21186489529079863
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,10240,2048,0.07521688938140869
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,10240,3072,0.15040711561838785
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,10240,3072,0.18361955218844941
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,10240,2560,0.12945332792070177
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,10240,1536,0.051810665263069995
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,10240,1024,0.034811556339263916
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,10240,2048,0.14185333251953125
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,10240,2048,0.10816088649961685
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,10240,1536,0.10438666741053264
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,10240,1536,0.08735111024644639
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,10240,1024,0.06573155853483412
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,10240,1024,0.09023911423153347
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,10240,512,0.024481778343518574
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,10240,768,0.0694133308198717
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,10240,768,0.05231644378768074
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,10240,256,0.01982399986849891
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,10240,512,0.04343822267320421
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,10240,512,0.058008001910315625
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,10240,128,0.01690933273898231
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,10240,256,0.0358915560775333
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,10240,256,0.04556177722083198
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,10240,6144,0.32999467849731445
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,10240,64,0.015492444237073263
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,10240,32,0.015564444992277356
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,10240,128,0.037575999895731606
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,10240,64,0.032984889215893216
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,10240,32,0.032391111056009926
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,10240,2560,0.08008178075154622
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,10240,2560,0.15260444747077093
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,10240,768,0.027729777826203242
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,8192,16384,0.42268800735473633
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,10240,128,0.0332551101843516
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,8192,51200,1.288047154744466
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,8192,65536,1.6304986741807725
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,8192,12288,0.32133155398898655
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,8192,16384,0.7454524570041232
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,8192,12288,0.5803342395358616
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,8192,16384,0.782734235127767
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,8192,10240,0.2733413378397624
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,8192,12288,0.6167422400580512
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,8192,51200,2.4876978132459855
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,8192,10240,0.4360693295796712
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,8192,8192,0.2225884331597222
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,8192,7168,0.1977004475063748
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,8192,8192,0.3509511152903239
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,8192,10240,0.5062222480773926
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,8192,65536,3.3537120819091797
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,8192,8192,0.40231911341349286
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,8192,6144,0.14860888322194418
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,8192,7168,0.31889955202738446
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,8192,51200,2.4632445441351996
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,8192,5120,0.1347928841908773
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,8192,6144,0.2664017677307129
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,8192,7168,0.354003561867608
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,8192,4096,0.10946666532092625
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,8192,6144,0.30032266510857475
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,8192,5120,0.2153244415918986
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,8192,3584,0.09639644622802734
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,8192,4096,0.17464089393615723
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,8192,5120,0.265209780799018
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,8192,4096,0.2062995566262139
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,8192,3072,0.08375110891130234
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,8192,65536,3.152616924709744
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,8192,3584,0.15074843830532497
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,8192,3584,0.18554755051930746
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,8192,2048,0.05352888835801018
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,8192,3072,0.13329688707987467
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,8192,3072,0.16330488522847494
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,8192,2560,0.14198133680555555
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,8192,1536,0.04239999916818407
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,8192,2048,0.11726221773359512
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,8192,2048,0.09469333622190688
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,8192,1024,0.02868710954984029
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,8192,768,0.02312177750799391
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,8192,1536,0.07574311229917738
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,8192,1536,0.09763822290632461
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,8192,1024,0.07480000125037299
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,8192,512,0.018974221414989896
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,8192,1024,0.056622220410241016
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,8192,768,0.06320533487531874
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,8192,256,0.013895110951529609
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,8192,512,0.053575999206966825
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,8192,512,0.03779022230042352
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,8192,128,0.011756444142924415
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,8192,256,0.03105866577890184
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,8192,64,0.009983110758993361
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,8192,128,0.034232000509897866
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,8192,32,0.011751111182901593
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,8192,64,0.028390222125583228
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,8192,32,0.02809244394302368
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,8192,2560,0.06935111019346449
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,8192,2560,0.1169475581910875
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,8192,768,0.045639998382992215
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,8192,256,0.04080977704789903
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,8192,128,0.028520888752407495
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,7168,51200,1.0489920510186088
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,7168,16384,0.3405333360036214
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,7168,65536,1.5977884928385417
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,7168,12288,0.2443244457244873
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,7168,16384,0.6475591129726833
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,7168,10240,0.2283733420901828
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,7168,12288,0.6301253106858995
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,7168,16384,0.7599289152357313
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,7168,12288,0.5819946924845377
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,7168,8192,0.1868248913023207
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,7168,10240,0.4239671230316162
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,7168,51200,2.28218142191569
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,7168,8192,0.3243937757280138
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,7168,7168,0.15388888782925075
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,7168,10240,0.4830177625020345
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,7168,6144,0.13146755430433485
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,7168,65536,3.024590174357096
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,7168,7168,0.28541866938273114
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,7168,8192,0.40123732884724933
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,7168,5120,0.11060088872909546
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,7168,6144,0.23940621482001412
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,7168,7168,0.33479823006523984
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,7168,4096,0.08897155523300171
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,7168,6144,0.30102488729688853
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,7168,5120,0.19724622037675646
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,7168,3584,0.07822933461931017
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,7168,5120,0.2431431081559923
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,7168,4096,0.157261331876119
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,7168,3072,0.07173333565394084
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,7168,4096,0.19576088587443033
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,7168,51200,2.301961686876085
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,7168,2560,0.05537333422236972
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,7168,3584,0.14201777511172825
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,7168,3584,0.17529688941107857
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,7168,2048,0.04620000057750278
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,7168,65536,2.9374622768825955
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,7168,3072,0.15393955177730984
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,7168,1536,0.03597866826587253
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,7168,2560,0.10623021920522054
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,7168,1024,0.025776889589097764
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,7168,2560,0.1334773302078247
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,7168,2048,0.11260444588131374
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,7168,2048,0.0901048911942376
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,7168,768,0.01999288962946998
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,7168,1536,0.09165244632297093
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,7168,1536,0.06986755794949003
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,7168,1024,0.05242933498488533
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,7168,1024,0.07505777809354994
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,7168,512,0.01556799974706438
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,7168,256,0.012472000386979846
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,7168,768,0.04319999946488274
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,7168,768,0.060255997710757785
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,7168,128,0.011052444577217102
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,7168,512,0.05122933453983731
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,7168,512,0.035056889057159424
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,7168,256,0.02791822287771437
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,7168,256,0.04155110981729295
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,7168,64,0.009691555466916826
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,7168,32,0.009929777847396003
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,7168,128,0.032568001084857516
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,7168,128,0.026720888084835474
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,7168,64,0.02624977793958452
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,7168,32,0.026385777526431616
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,7168,3072,0.12440710597568089
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,6144,51200,0.9248551262749566
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,6144,16384,0.3303617901272244
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,6144,65536,1.2213848961724174
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,6144,12288,0.2574480109744602
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,6144,16384,0.6132355795966254
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,6144,16384,0.7077395651075574
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,6144,12288,0.4756808810763889
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,6144,51200,2.1036995781792536
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,6144,10240,0.21937867005666098
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,6144,8192,0.1730933321846856
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,6144,12288,0.5380151006910536
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,6144,10240,0.3816595607333713
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,6144,8192,0.3052906725141737
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,6144,7168,0.15443378024631077
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,6144,65536,2.7177520328097873
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,6144,10240,0.4504373338487413
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,6144,6144,0.12865244017706975
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,6144,7168,0.2608293427361382
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,6144,5120,0.10313955280515884
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,6144,8192,0.3790586789449056
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,6144,6144,0.2302044497595893
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,6144,7168,0.3189306788974338
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,6144,4096,0.08461688624487983
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,6144,6144,0.27186666594611275
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,6144,5120,0.18058755662706164
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,6144,3584,0.07201155689027575
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,6144,3072,0.06268533070882161
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,6144,4096,0.1463093360265096
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,6144,3584,0.12758310635884604
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,6144,3584,0.16564267211490208
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,6144,65536,2.7782372368706594
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,6144,2560,0.052468445565965444
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,6144,3072,0.11418044567108154
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,6144,3072,0.14779555797576904
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,6144,2048,0.04313155677583483
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,6144,1536,0.034310221672058105
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,6144,2560,0.09813866350385879
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,6144,2560,0.12687555948893228
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,6144,2048,0.10737244288126628
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,6144,2048,0.08131200075149536
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,6144,1024,0.025459556115998164
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,6144,1536,0.06423466735415988
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,6144,768,0.020427554845809937
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,6144,1536,0.08657333585951064
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,6144,512,0.018056000272432964
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,6144,1024,0.04818488823042976
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,6144,51200,2.177767011854384
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,6144,768,0.057321780257754855
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,6144,768,0.038889778984917536
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,6144,256,0.014206222361988492
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,6144,128,0.012496000362767113
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,6144,512,0.04936888813972473
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,6144,256,0.03735111157099406
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,6144,256,0.026105778084860906
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,6144,64,0.01146133326821857
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,6144,32,0.011734222372372946
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,6144,128,0.03185955683390299
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,6144,128,0.02440533373090956
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,6144,64,0.024433778391944036
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,6144,5120,0.24598222308688691
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,6144,32,0.02403822210099962
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,6144,4096,0.18686132960849336
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,6144,1024,0.06824088758892484
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,5120,51200,0.7123386594984266
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,6144,512,0.032107555203967623
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,5120,65536,1.1189813613891602
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,5120,16384,0.27099643813239205
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,5120,12288,0.23083554373847115
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,5120,16384,0.5824382040235732
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,5120,12288,0.4189617898729112
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,5120,10240,0.15447733137342665
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,5120,16384,0.6689039866129557
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,5120,51200,1.8798792097303603
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,5120,12288,0.6428062121073405
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,5120,10240,0.4285786681705051
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,5120,8192,0.2774924437204997
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,5120,7168,0.1133413314819336
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,5120,8192,0.35044177373250324
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,5120,51200,2.051323572794596
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,5120,7168,0.2422720061408149
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,5120,6144,0.102000892162323
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,5120,7168,0.30345243877834743
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,5120,65536,2.6198461320665145
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,5120,5120,0.08787111441294353
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,5120,6144,0.25807378027174205
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,5120,10240,0.34597155782911515
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,5120,4096,0.06788000133302477
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,5120,5120,0.16600799560546875
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,5120,4096,0.13350221845838758
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,5120,4096,0.17700889375474718
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,5120,3584,0.06065333551830716
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,5120,65536,2.4736124674479165
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,5120,3072,0.054655998945236206
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,5120,3584,0.11825777424706353
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,5120,3584,0.15773599677615696
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,5120,2560,0.04337155487802294
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,5120,3072,0.1034311122364468
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,5120,3072,0.13845333788130018
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,5120,2048,0.03346044487423367
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,5120,2560,0.08819733063379924
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,5120,2560,0.11905866199069554
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,5120,1536,0.02738222148683336
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,5120,2048,0.10170311397976345
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,5120,1024,0.02040799955526988
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,5120,6144,0.20327111085255942
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,5120,1536,0.05792533026801216
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,5120,1536,0.08234400219387479
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,5120,768,0.015978667471143935
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,5120,1024,0.043904887305365674
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,5120,1024,0.0648204419347975
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,5120,8192,0.14510044786665174
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,5120,512,0.01239733315176434
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,5120,768,0.055325332615110606
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,5120,768,0.035601778162850276
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,5120,256,0.009639999932712978
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,5120,128,0.008691555923885768
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,5120,512,0.045428444941838585
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,5120,512,0.029538667864269678
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,5120,256,0.03617777758174472
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,5120,256,0.02423288921515147
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,5120,32,0.009648000200589498
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,5120,128,0.030586666531032983
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,5120,64,0.022299556268586054
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,5120,32,0.02199733257293701
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,5120,2048,0.0747893320189582
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,4096,65536,0.9127848943074545
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,5120,64,0.00928177767329746
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,5120,128,0.02240266733699375
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,4096,51200,0.7650782267252604
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,4096,16384,0.23108355204264322
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,4096,12288,0.18295910623338488
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,4096,16384,0.4979697863260905
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,4096,12288,0.37448978424072266
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,4096,16384,0.6618053118387858
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,4096,65536,2.10775015089247
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,4096,10240,0.14338844352298313
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,5120,5120,0.21579110622406006
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,4096,12288,0.47921334372626406
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,4096,8192,0.11727110544840495
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,4096,7168,0.10597778028912014
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,4096,10240,0.317230224609375
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,4096,51200,1.6654604805840387
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,4096,8192,0.25092000431484646
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,4096,10240,0.40500532256232363
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,4096,6144,0.08618044190936619
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,4096,8192,0.3264888922373454
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,4096,7168,0.21955645084381104
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,4096,5120,0.07683910926183064
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,4096,7168,0.28408532672458225
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,4096,4096,0.061327113045586475
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,4096,65536,2.459120856391059
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,4096,6144,0.18422933419545492
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,4096,6144,0.24335198932223848
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,4096,5120,0.15084621641370985
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,4096,3584,0.053779555691613086
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,4096,5120,0.203658660252889
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,4096,51200,1.9231253729926214
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,4096,3072,0.04491110973887973
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,4096,4096,0.12211199601491292
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,4096,4096,0.1670302285088433
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,4096,2560,0.03743199838532342
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,4096,3584,0.1078195571899414
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,4096,2048,0.03090488910675049
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,4096,3584,0.14869956175486246
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,4096,3072,0.09490311145782471
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,4096,3072,0.13031555546654597
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,4096,2560,0.11318311426374648
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,4096,1024,0.018274666534529794
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,4096,2048,0.09538755814234416
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,4096,2048,0.06541777981652154
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,4096,768,0.014669333895047506
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,4096,1536,0.05293955405553182
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,4096,1536,0.07823822233412
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,4096,1024,0.06099377738104927
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,4096,512,0.011762667033407422
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,4096,1024,0.04012889001104567
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,4096,256,0.009022222624884712
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,4096,768,0.03237066666285197
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,4096,768,0.051817778084013194
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,4096,128,0.007609777980380588
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,4096,512,0.0424542228380839
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,4096,256,0.02198311189810435
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,4096,256,0.033724443780051336
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,4096,64,0.008294222255547842
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,4096,128,0.02035999960369534
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,4096,128,0.029145777225494385
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,4096,32,0.0086986662613021
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,4096,64,0.020484444167878892
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,4096,32,0.01995466649532318
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,4096,1536,0.024412444896168176
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,3584,65536,0.6749217775132922
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,4096,2560,0.08011200030644734
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,3584,51200,0.5304880142211914
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,3584,16384,0.17844800154368082
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,4096,512,0.02642222245534261
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,3584,12288,0.13880088594224718
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,3584,16384,0.4947795338100857
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,3584,16384,0.5975688828362359
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,3584,10240,0.11997332837846543
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,3584,12288,0.45781776640150285
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,3584,65536,1.9914480845133464
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,3584,8192,0.09634133179982503
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,3584,10240,0.2982470989227295
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,3584,51200,1.5630648930867512
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,3584,7168,0.0808053347799513
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,3584,8192,0.23834310637580025
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,3584,8192,0.3087493313683404
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,3584,7168,0.20834488338894316
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,3584,6144,0.07160711288452148
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,3584,65536,2.313873714870877
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,3584,7168,0.2687857680850559
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,3584,12288,0.3562942345937093
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,3584,5120,0.06080977784262764
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,3584,51200,1.8196640014648438
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,3584,4096,0.046909332275390625
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,3584,6144,0.17618132962120903
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,3584,6144,0.22910488976372612
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,3584,3584,0.04184800055291918
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,3584,5120,0.14407644006941053
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,3584,5120,0.19274044036865234
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,3584,4096,0.11626666122012669
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,3584,4096,0.1573866605758667
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,3584,3072,0.03503733211093479
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,3584,2560,0.02889333168665568
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,3584,3584,0.1028862198193868
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,3584,3584,0.140557328859965
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,3584,2048,0.02420177724626329
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,3584,3072,0.12347200181749131
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,3584,1536,0.019709333777427673
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,3584,2560,0.10676888624827068
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,3584,2560,0.07648444175720215
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,3584,1024,0.014852444330851236
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,3584,2048,0.09051644139819676
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,3584,2048,0.06174577607048882
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,3584,768,0.012257777982287936
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,3584,10240,0.38263466623094344
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,3584,1536,0.05003822180959913
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,3584,512,0.009663110805882348
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,3584,1024,0.03821333249409994
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,3584,768,0.03122666809293959
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,3584,768,0.047930667797724404
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,3584,512,0.04138488901986016
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,3584,512,0.02590755621592204
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,3584,128,0.006953777538405524
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,3584,256,0.033519999848471746
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,3584,256,0.02085599965519375
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,3584,64,0.00628266649113761
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,3584,128,0.028894222444958154
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,3584,32,0.00657066661450598
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,3584,128,0.01960000064637926
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,3584,64,0.01921866668595208
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,3584,32,0.01905155513021681
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,3072,65536,0.5750533209906684
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,3584,3072,0.09023111396365696
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,3072,51200,0.4865440262688531
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,3584,1536,0.07403377691904704
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,3584,1024,0.05775022506713867
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,3072,16384,0.17569777700636122
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,3584,256,0.007266666326257918
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,3072,12288,0.13644622431861028
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,3072,16384,0.44649420844184023
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,3072,12288,0.33681334389580625
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,3072,10240,0.10684088865915935
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,3072,16384,0.5940577718946669
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,3072,12288,0.4721120198567708
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,3072,8192,0.08997955587175156
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,3072,10240,0.2827226585812039
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,3072,7168,0.07129066520267062
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,3072,65536,1.8945492638481989
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,3072,10240,0.3798497782813178
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,3072,8192,0.2289973364935981
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,3072,6144,0.06561866733762953
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,3072,8192,0.30760712093777126
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,3072,7168,0.19713866710662842
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,3072,5120,0.05654044283760918
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,3072,7168,0.2669546604156494
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,3072,6144,0.16759199566311309
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,3072,4096,0.04359022114011976
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,3072,6144,0.2283866670396593
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,3072,5120,0.13635910881890193
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,3072,5120,0.1912026670244005
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,3072,3584,0.03808177842034234
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,3072,4096,0.10940888855192397
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,3072,4096,0.15585688749949136
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,3072,51200,1.8037662506103516
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,3072,3072,0.03398222062322829
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,3072,65536,2.3047031826443143
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,3072,3584,0.1398844454023573
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,3072,3584,0.0972213347752889
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,3072,2048,0.02479377720091078
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,3072,3072,0.0850142240524292
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,3072,2560,0.07187555233637492
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,3072,2560,0.10578311151928371
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,3072,1536,0.020077332854270935
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,3072,2048,0.060119999779595264
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,3072,2048,0.08973511060078938
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,3072,1024,0.015014222926563688
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,3072,1536,0.046499556965298124
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,3072,1536,0.0731368859608968
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,3072,768,0.012100444071822695
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,3072,1024,0.057124442524380155
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,3072,1024,0.035818666219711304
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,3072,51200,1.48016177283393
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,3072,512,0.010010666317409938
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,3072,768,0.029509332444932725
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,3072,768,0.04761155446370443
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,3072,512,0.024479111035664875
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,3072,512,0.04039288891686334
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,3072,128,0.006692444284756978
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,3072,256,0.032131556007597185
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,3072,256,0.019926221834288705
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,3072,64,0.006576889091067844
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,3072,32,0.006581333362393909
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,3072,128,0.027280888623661462
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,3072,128,0.018564444449212816
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,3072,64,0.01819022165404426
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,3072,32,0.018187556001875136
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,3072,2560,0.029280887709723577
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,3072,3072,0.12237689230177139
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,2560,65536,0.5110630989074707
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,2560,51200,0.42479289902581113
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,2560,16384,0.14383910761939153
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,3072,256,0.007655111451943715
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,2560,12288,0.10550666517681545
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,2560,16384,0.45314402050442165
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,2560,16384,0.5854826503329807
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,2560,12288,0.31891022788153756
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,2560,10240,0.09590222438176473
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,2560,12288,0.430039988623725
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,2560,51200,1.3695075776841905
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,2560,8192,0.07342488898171319
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,2560,65536,1.7505227194892035
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,2560,10240,0.2668631076812744
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,2560,7168,0.06213421954049004
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,2560,8192,0.21495644251505533
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,2560,10240,0.35880443784925675
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,2560,6144,0.05104177859094408
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,2560,8192,0.28995733790927464
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,2560,7168,0.1866462230682373
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,2560,5120,0.04467199908362495
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,2560,7168,0.2517813311682807
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,2560,51200,1.6945635477701824
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,2560,4096,0.03446311089727614
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,2560,6144,0.157587554719713
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,2560,3584,0.03081866767671373
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,2560,6144,0.21352710988786486
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,2560,5120,0.128985775841607
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,2560,5120,0.1799751122792562
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,2560,3072,0.02756533357832167
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,2560,65536,2.1633964114718967
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,2560,4096,0.10365688800811768
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,2560,4096,0.1471173365910848
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,2560,2560,0.023062222533755835
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,2560,3584,0.13202755981021458
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,2560,2048,0.020061333974202473
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,2560,3072,0.08116888999938965
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,2560,3072,0.11579467190636529
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,2560,2560,0.1003991100523207
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,2560,2560,0.06913066572613187
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,2560,2048,0.05613599883185493
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,2560,2048,0.08476533492406209
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,2560,1024,0.011382222175598145
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,2560,768,0.009879111415810054
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,2560,1536,0.06936888562308417
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,2560,1536,0.04349955585267809
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,2560,512,0.007780444290902879
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,2560,1024,0.054719110329945884
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,2560,1024,0.03329599897066752
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,2560,768,0.02747822304566701
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,2560,256,0.006286222073766921
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,2560,768,0.04491733180152046
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,2560,128,0.0058346668051348785
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,2560,512,0.02299733294381036
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,2560,512,0.039749334255854286
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,2560,256,0.018927110566033255
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,2560,256,0.03138755427466498
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,2560,128,0.01755288905567593
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,2560,32,0.005254222287072076
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,2560,64,0.017200888858901132
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,2560,32,0.017122666041056316
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,2048,65536,0.48280175526936847
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,2560,3584,0.09193511141671075
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,2560,1536,0.01605599953068627
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,2048,51200,0.39812800619337296
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,2048,16384,0.1419644488228692
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,2560,64,0.0052168890833854675
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,2560,128,0.027016000615225896
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,2048,12288,0.0913519991768731
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,2048,16384,0.43036890029907227
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,2048,65536,1.5804177390204535
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,2048,12288,0.30072887738545734
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,2048,10240,0.07147555881076388
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,2048,16384,0.5556293593512641
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,2048,51200,1.237703111436632
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,2048,8192,0.05963999695248074
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,2048,10240,0.2521786689758301
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,2048,12288,0.42708444595336914
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,2048,8192,0.20248799853854707
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,2048,7168,0.05099911159939236
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,2048,6144,0.04200889004601372
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,2048,10240,0.3547831111484104
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,2048,8192,0.2887270980411106
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,2048,5120,0.036552889479531184
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,2048,7168,0.17775021659003365
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,2048,65536,2.1481058332655167
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,2048,7168,0.2498879962497287
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,2048,6144,0.14854133129119873
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,2048,4096,0.029156443145540025
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,2048,6144,0.21231467194027373
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,2048,3584,0.026909333136346605
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,2048,5120,0.12179466088612874
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,2048,5120,0.17825599511464438
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,2048,3072,0.02296177711751726
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,2048,4096,0.09814221991433038
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,2048,4096,0.14578933186001247
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,2048,3584,0.13042578432295057
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,2048,2560,0.0195768889453676
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,2048,2048,0.017260443833139207
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,2048,3072,0.11474843819936116
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,2048,3072,0.07557244433297051
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,2048,1536,0.013590222431553734
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,2048,2560,0.06482133600446913
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,2048,2560,0.09932977623409694
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,2048,2048,0.05254400107595655
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,2048,2048,0.08438222275839911
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,2048,1536,0.04100177685419718
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,2048,1536,0.06825511323081122
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,2048,768,0.008584889272848764
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,2048,1024,0.05266133281919691
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,2048,512,0.00723555518521203
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,2048,768,0.0259244441986084
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,2048,768,0.04454311066203647
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,2048,256,0.005960000058015187
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,2048,512,0.021643555826610986
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,2048,512,0.038507554266187884
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,2048,128,0.00565244464410676
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,2048,256,0.01756177842617035
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,2048,256,0.030807110998365615
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,2048,64,0.005600000007285013
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,2048,128,0.016255110502243042
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,2048,128,0.026399999856948853
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,2048,51200,1.6834399965074327
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,2048,64,0.01620444489849938
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,2048,32,0.015805333852767944
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,2048,3584,0.08736888567606609
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,1536,65536,0.3260062270694309
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,1536,51200,0.25557510058085126
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,1536,16384,0.09142844544516669
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,2048,1024,0.010375111467308467
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,2048,1024,0.03122933374510871
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,1536,12288,0.05995644463433159
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,1536,16384,0.3872533374362522
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,1536,16384,0.5197751257154677
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,2048,32,0.005567111074924469
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,1536,12288,0.2848275502522786
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,1536,10240,0.054570668273501925
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,1536,8192,0.04282844397756788
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,1536,51200,1.1559040281507704
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,1536,12288,0.3995173242357042
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,1536,65536,1.4814204110039606
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,1536,10240,0.2388231224483914
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,1536,7168,0.038479109605153404
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,1536,8192,0.19195289081997344
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,1536,7168,0.16699555185106066
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,1536,7168,0.23441688219706217
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,1536,6144,0.14071288373735216
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,1536,5120,0.02748888896571265
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,1536,51200,1.5788710912068684
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,1536,6144,0.1994382275475396
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,1536,4096,0.021874666213989258
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,1536,5120,0.11446577972835964
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,1536,5120,0.16742755307091606
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,1536,65536,2.0083395640055337
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,1536,3584,0.020302222834693063
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,1536,3072,0.017237333787812125
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,1536,4096,0.13690666357676187
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,1536,3584,0.08129422532187568
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,1536,3584,0.12220711178249782
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,1536,2560,0.015562666787041558
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,1536,3072,0.07116266753938463
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,1536,3072,0.10771911011801825
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,1536,2048,0.013185777597957186
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,1536,2560,0.09366222222646077
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,1536,2048,0.04908711049291822
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,1536,6144,0.032109333409203425
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,1536,1536,0.010602666272057427
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,1536,2048,0.07957333326339722
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,1536,1024,0.00889955543809467
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,1536,1536,0.037971556186676025
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,1536,8192,0.2697262234157986
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,1536,768,0.007679111427730984
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,1536,1024,0.029577778445349798
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,1536,1024,0.04948711064126757
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,1536,512,0.006587555425034628
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,1536,768,0.04246933261553446
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,1536,768,0.024511110451486375
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,1536,256,0.0052577778697013855
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,1536,512,0.020592000749376085
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,1536,512,0.03663555449909634
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,1536,128,0.004559111264016894
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,1536,4096,0.09195199939939712
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,1536,256,0.029426667425367568
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,1536,64,0.004234666625658671
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,1536,128,0.015207999282413058
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,1536,128,0.025157334076033697
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,1536,32,0.004513777792453766
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,1536,64,0.014801777071423002
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,1536,32,0.01482311056719886
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,1024,65536,0.2354666656917996
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,1536,10240,0.33304089970058864
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,1024,51200,0.18956266509162056
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,1536,1536,0.06466399961047702
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,1024,16384,0.0657164454460144
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,1536,256,0.016789333687888253
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,1024,16384,0.353312889734904
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,1024,12288,0.04554133282767402
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,1536,2560,0.06015288829803467
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,1024,51200,1.0797395706176758
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,1024,65536,1.3796951505872939
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,1024,10240,0.03990488913324144
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,1024,16384,0.515392886267768
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,1024,8192,0.03126400046878391
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,1024,10240,0.2248631053500705
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,1024,12288,0.39206756485833066
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,1024,10240,0.3303866651323107
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,1024,7168,0.027637332677841187
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,1024,8192,0.18016000588734946
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,1024,6144,0.02330044408639272
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,1024,51200,1.5676097869873047
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,1024,5120,0.020074667202101815
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,1024,65536,1.9948702918158636
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,1024,7168,0.23257154888576934
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,1024,6144,0.19835289319356283
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,1024,4096,0.017098666893111337
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,1024,5120,0.10707377725177342
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,1024,5120,0.16631910536024305
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,1024,3584,0.015169777803950839
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,1024,4096,0.08627111381954616
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,1024,4096,0.13577422830793592
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,1024,3072,0.013653332988421122
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,1024,3584,0.12189422713385688
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,1024,3584,0.07646399736404419
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,1024,2560,0.011911110745535957
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,1024,3072,0.06670666403240628
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,1024,3072,0.1067919996049669
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,1024,2048,0.010113777385817634
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,1024,2560,0.05585866504245334
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,1024,2560,0.09285155269834731
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,1024,1536,0.00867022242810991
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,1024,2048,0.04513511061668396
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,1024,1024,0.0069360000391801195
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,1024,1536,0.03531288769510057
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,1024,1536,0.062236441506279834
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,1024,768,0.005955555372767978
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,1024,1024,0.02753066685464647
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,1024,1024,0.04912622107399834
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,1024,7168,0.15644889407687718
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,1024,512,0.005264889034960005
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,1024,768,0.04227022329966227
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,1024,6144,0.13205777274237737
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,1024,256,0.00453955555955569
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,1024,512,0.03605066736539205
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,1024,512,0.019575110740131803
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,1024,128,0.0041751112374994485
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,1024,256,0.02940444482697381
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,1024,256,0.015820443630218506
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,1024,64,0.004571555389298333
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,1024,32,0.004600000050332812
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,1024,128,0.024738666084077623
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,1024,128,0.014352889524565803
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,1024,64,0.014120888378885059
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,1024,12288,0.26787466473049587
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,1024,32,0.013879111243618859
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,768,65536,0.19217777252197266
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,768,51200,0.14513866106669107
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,768,16384,0.049788445234298706
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,1024,2048,0.07822133435143365
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,768,16384,0.3419653309716119
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,1024,8192,0.26867379082573783
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,1024,768,0.023232888844278123
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,768,12288,0.03797511259714762
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,768,12288,0.2599742147657606
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,768,51200,1.0435991287231445
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,768,10240,0.029208001163270738
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,768,16384,0.48102580176459414
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,768,12288,0.3662835492028131
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,768,8192,0.02479733361138238
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,768,10240,0.21796266237894693
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,768,7168,0.021734222769737244
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,768,10240,0.3083679940965441
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,768,8192,0.1748346620135837
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,768,6144,0.019476445184813607
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,768,51200,1.4557138019137914
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,768,8192,0.25036711162990993
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,768,5120,0.017039111918873258
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,768,7168,0.15195733971065944
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,768,7168,0.21733066770765516
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,768,6144,0.12787644068400064
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,768,65536,1.8526596493191188
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,768,6144,0.18404444058736166
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,768,4096,0.014874666929244995
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,768,5120,0.10383022493786281
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,768,3584,0.012871111432711283
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,768,3072,0.01183733344078064
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,768,4096,0.08297155300776164
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,768,4096,0.12699822584788004
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,768,3584,0.07390311029222277
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,768,3584,0.11311911212073432
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,768,2560,0.010069333016872406
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,768,3072,0.06454310814539592
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,768,2048,0.00868977771864997
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,768,3072,0.09988888767030503
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,768,2560,0.05351555678579542
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,768,1536,0.007601777712504069
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,768,2048,0.07237066825230916
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,768,2048,0.043143110142813794
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,768,65536,1.3338017993503148
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,768,1024,0.006275555739800136
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,768,768,0.005581333405441708
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,768,1536,0.05854666895336575
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,768,1536,0.03399822115898132
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,768,1024,0.04624533322122362
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,768,1024,0.026723555392689172
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,768,512,0.004920000003443824
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,768,768,0.022351110974947613
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,768,256,0.004229333251714706
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,768,768,0.03952177696757846
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,768,128,0.003916444463862313
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,768,512,0.0188719994492001
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,768,256,0.014952888091405233
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,768,256,0.027823110421498615
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,768,128,0.023708444502618577
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,768,32,0.003891555385457145
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,768,64,0.01346933344999949
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,768,32,0.01312355531586541
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,512,65536,0.1486026710934109
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,768,5120,0.1545271078745524
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,512,51200,0.11770310666826035
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,768,2560,0.08688177665074666
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,512,16384,0.0381351113319397
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,768,512,0.034597333934572004
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,768,64,0.0035377778112888336
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,768,128,0.013758222262064615
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,512,16384,0.33185243606567383
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,512,12288,0.02681688964366913
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,512,10240,0.021976000732845728
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,512,51200,1.01127380794949
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,512,65536,1.2901795705159504
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,512,8192,0.018716444571812946
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,512,12288,0.2522275447845459
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,512,10240,0.21096177895863852
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,512,16384,0.4798409144083659
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,512,12288,0.364682674407959
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,512,7168,0.016926222377353244
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,512,6144,0.014879110786649915
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,512,10240,0.30694577429029674
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,512,8192,0.16926933659447563
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,512,5120,0.013134222063753339
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,512,51200,1.4537848366631403
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,512,8192,0.24972356690300834
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,512,7168,0.1473333305782742
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,512,6144,0.12384177578820123
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,512,6144,0.18430488639407686
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,512,5120,0.10042044189241196
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,512,3584,0.010395555860466426
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,512,5120,0.15425066153208414
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,512,4096,0.1265582243601481
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,512,3072,0.009359111388524374
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,512,3584,0.07086666425069173
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,512,3584,0.11318222681681316
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,512,2560,0.008339555727110969
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,512,3072,0.09976266490088569
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,512,3072,0.06202844116422865
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,512,2048,0.007298666569921706
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,512,2560,0.051629334688186646
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,512,1536,0.006590222318967183
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,512,2048,0.04134933484925164
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,512,2048,0.07172977924346924
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,512,1536,0.032999111546410456
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,512,1536,0.05820888943142361
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,512,1024,0.005260444349712796
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,512,1024,0.04601866669125027
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,512,1024,0.025780444343884785
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,512,768,0.004875555634498596
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,512,7168,0.21687555313110352
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,512,512,0.004506666627195147
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,512,65536,1.8494372897677953
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,512,4096,0.08021955357657538
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,512,512,0.01829688913292355
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,512,256,0.0038204445607132385
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,512,512,0.03396888905101352
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,512,128,0.0035182221068276297
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,512,256,0.02718933257791731
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,512,256,0.014697778556081982
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,512,64,0.0031617778456873367
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,512,128,0.013125333521101209
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,512,128,0.023027555810080633
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,512,32,0.003522666792074839
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,512,2560,0.08632089032067193
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,512,64,0.013186666700575085
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,256,65536,0.08014221986134847
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,512,32,0.012759110993809171
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,256,51200,0.06532000170813666
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,512,4096,0.01130488928821352
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,512,768,0.03973866502443949
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,512,768,0.021651556094487507
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,256,16384,0.02546311087078518
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,256,12288,0.02017511096265581
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,256,16384,0.32110844718085396
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,256,12288,0.2442693445417616
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,256,10240,0.018762666318151686
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,256,16384,0.47435734007093644
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,256,65536,1.248744010925293
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,256,8192,0.01611911091539595
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,256,10240,0.20436978340148926
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,256,12288,0.36134666866726345
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,256,7168,0.013746666411558786
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,256,8192,0.16396266884273952
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,256,10240,0.3042302131652832
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,256,6144,0.012820444173283048
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,256,8192,0.24734576543172201
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,256,7168,0.14255910449557835
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,256,65536,1.8295519087049696
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,256,5120,0.01090400003724628
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,256,6144,0.12016177177429199
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,256,4096,0.010022222167915767
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,256,6144,0.18269599808586967
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,256,5120,0.096833778752221
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,256,5120,0.15290755695766872
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,256,3584,0.007996444072988298
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,256,4096,0.07786399788326688
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,256,3072,0.0074648890230390764
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,256,51200,0.9772888819376627
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,256,4096,0.12480533123016357
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,256,3584,0.06890310843785603
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,256,3584,0.11167377895779079
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,256,2560,0.006633777585294511
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,256,3072,0.09806755516264175
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,256,2560,0.049661331706576876
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,256,2560,0.08534310923682319
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,256,2048,0.0395671096112993
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,256,1536,0.0052560000783867305
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,256,1024,0.00453955555955569
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,256,2048,0.07130133443408541
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,256,1536,0.05713333023918999
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,256,1536,0.03190133306715224
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,256,51200,1.4354559580485027
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,256,1024,0.045560889773898654
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,256,1024,0.02502044373088413
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,256,512,0.0038337777886125776
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,256,768,0.020957332518365648
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,256,768,0.0387386679649353
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,256,512,0.033942222595214844
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,256,512,0.01789866718981001
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,256,256,0.00350222239891688
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,256,7168,0.2152737776438395
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,256,128,0.0031724443866146933
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,256,64,0.0028613333900769553
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,256,256,0.013816888961527081
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,256,256,0.027450667487250432
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,256,32,0.00315022220214208
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,256,128,0.02366399930583106
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,256,64,0.012373333175977072
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,256,32,0.012402666939629449
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,128,51200,0.050491554869545825
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,256,2048,0.00589155571328269
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,256,768,0.003964444415436851
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,128,16384,0.016973333226309884
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,128,51200,0.9460026423136393
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,256,128,0.01279022213485506
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,128,65536,1.209887080722385
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,128,12288,0.013172444370057849
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,128,16384,0.3118231031629774
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,128,65536,0.06241955359776815
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,128,10240,0.012423999607563019
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,128,12288,0.2369555632273356
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,128,10240,0.19869511657290986
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,256,3072,0.059792002042134605
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,128,8192,0.011027555498811932
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,128,12288,0.3606666723887126
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,128,16384,0.47362576590643984
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,128,10240,0.30390845404730904
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,128,7168,0.010955555571450127
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,128,6144,0.012431110772821637
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,128,51200,1.4308666653103297
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,128,65536,1.8281307220458984
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,128,8192,0.15930577119191489
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,128,5120,0.009763555394278632
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,128,8192,0.24696977933247885
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,128,7168,0.13845600022210017
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,128,7168,0.21426222059461805
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,128,4096,0.00832622249921163
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,128,6144,0.11589511235555013
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,128,3584,0.007651555869314406
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,128,6144,0.1818924480014377
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,128,5120,0.09383644660313924
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,128,5120,0.15236000219980875
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,128,4096,0.07488622268040974
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,128,3072,0.007266666326257918
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,128,4096,0.12469866540696885
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,128,3584,0.11148444811503093
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,128,3584,0.06658666663699679
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,128,3072,0.057167112827301025
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,128,2048,0.005868444426192178
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,128,3072,0.0979893340004815
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,128,2560,0.047079109483295016
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,128,1536,0.004888888862397936
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,128,2560,0.08367821905348037
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,128,1024,0.004230222354332606
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,128,2048,0.03771555423736572
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,128,2048,0.07283377647399902
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,128,768,0.003912000192536248
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,128,1536,0.03083733386463589
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,128,1536,0.056813332769605845
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,128,1024,0.04554133282767402
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,128,512,0.003495111233658261
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,128,1024,0.024380443824662104
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,128,256,0.0033475555893447665
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,128,768,0.038718223571777344
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,128,768,0.020534222324689228
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,128,128,0.0028088889602157804
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,128,512,0.03390399946106805
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,128,512,0.017176000608338248
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,128,64,0.002846222163902389
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,128,32,0.002833777831660377
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,128,128,0.022279111875428095
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,128,128,0.012518222133318583
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,128,64,0.012050666742854647
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,64,65536,0.05953422519895765
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,128,32,0.012080888781282636
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,64,51200,0.04775999983151754
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,64,16384,0.019351111518012155
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,64,12288,0.011755555868148804
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,64,16384,0.3113208876715766
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,64,10240,0.010689777632554373
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,64,12288,0.2365973260667589
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,64,8192,0.009705777797434065
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,64,10240,0.1979831059773763
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,64,8192,0.15890133380889893
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,64,7168,0.009211555951171452
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,64,6144,0.008672888908121321
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,64,51200,0.9473075866699219
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,64,5120,0.008639111287064022
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2560,128,256,0.026382222771644592
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,64,4096,0.007646222081449296
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,64,65536,1.2094586690266926
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,64,6144,0.11610578166113959
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,64,3584,0.006962666908899943
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,64,5120,0.09342222081290351
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,64,3072,0.006578666468461354
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,64,4096,0.07507999738057454
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,64,2560,0.005948444621430502
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,64,2048,0.005215999980767568
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,64,3584,0.06593333350287543
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,64,1536,0.004881777697139316
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,64,3072,0.05727466609742907
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,64,2560,0.047205332252714366
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,64,1024,0.0041955556306574075
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,64,2048,0.038322667280832924
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,64,768,0.0038337777886125776
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,64,512,0.00351555562681622
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,128,2560,0.006603555546866522
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,64,1536,0.030974222554100886
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,64,1024,0.02419288953145345
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,64,128,0.0029057777590221832
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,64,768,0.02029511166943444
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,64,64,0.0028533333291610083
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,64,512,0.01724444495307075
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,64,32,0.002838222309947014
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,64,256,0.013527111046844058
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,32,65536,0.057596445083618164
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,64,128,0.012114666402339935
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,64,64,0.012050666742854647
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,64,32,0.011716444459226398
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,32,51200,0.046647111574808754
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,32,16384,0.013073777986897362
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,32,12288,0.010446222292052375
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,128,256,0.013626666532622443
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,32,10240,0.009542221824328104
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,64,7168,0.13806222544776067
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,32,16384,0.31170932451883954
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,32,8192,0.008345777789751688
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,32,7168,0.008302222523424361
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,32,10240,0.1982088883717855
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,32,8192,0.15889599588182238
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,32,6144,0.007947555846638149
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,32,5120,0.007298666569921706
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,32,7168,0.13780089219411215
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,32,4096,0.007988444632954067
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,64,256,0.003212444484233856
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,32,51200,0.9466799630059136
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,32,3584,0.0070462218589252895
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,32,6144,0.11572710673014323
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,32,5120,0.0929751131269667
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,32,2560,0.005928888916969299
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,32,4096,0.07482755846447416
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,32,65536,1.20869869656033
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,32,3584,0.06588888830608793
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,32,3072,0.057108441988627114
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,32,1536,0.004507555729813046
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,32,1024,0.003826666623353958
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,32,2560,0.04695822132958306
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,32,768,0.0038293335172865125
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,32,2048,0.03934489025010003
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,32,512,0.0035084444615576
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,32,1024,0.02404266595840454
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,32,256,0.00282577777074443
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,32,768,0.020573332905769348
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,32,128,0.002862222285734283
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,32,512,0.01722133325205909
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,32,12288,0.2364764478471544
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,32,64,0.0028568889117903183
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,32,32,0.002817777709828483
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,32,256,0.013418667018413544
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,32,128,0.012104888757069906
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,32,64,0.012057777908113269
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,32,32,0.012055111428101858
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,32,3072,0.006520000182920032
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2560,32,2048,0.0052737775776121355
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2560,32,1536,0.030664887693193223
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,65536,12288,2.3170293172200522
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,65536,10240,2.100249820285373
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,65536,16384,3.0792772505018444
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,65536,12288,2.53769768608941
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,65536,16384,3.593176947699653
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,65536,10240,2.118760002983941
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,65536,8192,1.5666862063937719
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,65536,7168,1.3589742448594835
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,65536,7168,1.3913022147284613
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,65536,8192,1.641856935289171
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,65536,6144,1.1519467035929363
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,65536,5120,0.9104177686903211
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,65536,4096,0.689144876268175
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,65536,6144,1.1908213297526042
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,65536,3584,0.6789057519700793
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,65536,4096,0.7675129042731391
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,65536,5120,1.0023555755615234
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,65536,3072,0.5417484707302517
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,65536,2048,0.35245511266920304
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,65536,2560,0.4841849009195964
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,65536,3072,0.5920320087009007
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,65536,3584,0.7420550982157389
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,65536,2560,0.505209763844808
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,65536,1536,0.28080799844529897
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,65536,1024,0.22902401288350424
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,65536,768,0.16477866967519125
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,65536,1024,0.25363466474745006
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,65536,2048,0.4485795762803819
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,65536,512,0.12673778004116482
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,65536,256,0.08681688706080119
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,65536,128,0.07265422079298231
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,65536,1536,0.434911118613349
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,65536,768,0.23090222146775988
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,65536,512,0.16917955875396729
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,65536,64,0.06647911336686876
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,65536,256,0.1526764498816596
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,65536,32,0.07402666409810384
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,65536,128,0.143251551522149
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,65536,64,0.18031644821166992
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,65536,32,0.1431164476606581
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,51200,16384,2.370652516682943
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,65536,51200,9.868025885687933
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,51200,16384,2.8067796495225696
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,51200,12288,1.749339527553982
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,51200,10240,1.461814244588216
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,51200,12288,2.0287867652045355
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,51200,8192,1.1830231348673503
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,51200,10240,1.653178638882107
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,51200,8192,1.3109315236409504
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,51200,7168,1.0371298260158963
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,65536,51200,14.331720987955729
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,51200,51200,7.308876037597656
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,51200,7168,1.1030808554755318
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,51200,6144,0.926513777838813
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,51200,4096,0.5824542045593262
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,51200,6144,0.9723013771904839
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,51200,4096,0.6732524236043295
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,51200,5120,0.791794670952691
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,51200,3584,0.5542764663696289
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,51200,3584,0.5431369145711263
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,51200,3072,0.4482977655198839
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,51200,2560,0.3915484481387668
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,51200,3072,0.5047698020935059
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,51200,5120,0.8696995311313205
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,51200,65536,9.459829542371962
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,51200,2560,0.43084534009297687
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,51200,2048,0.3252951039208306
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,51200,1536,0.24227733082241484
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,51200,1024,0.17082133558061388
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,51200,768,0.13440177175733778
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,51200,2048,0.3362373246086969
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,51200,1024,0.23639199468824598
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,51200,512,0.09894755813810562
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,51200,256,0.0819715526368883
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,51200,768,0.16320266988542345
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,51200,512,0.13590666982862684
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,51200,1536,0.28720177544487846
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,51200,128,0.05762933360205757
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,51200,256,0.12081066767374675
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,51200,32,0.056851552592383496
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,51200,128,0.11474133862389459
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,51200,64,0.11522755357954238
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,51200,32,0.1149173312717014
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,51200,51200,11.120407104492188
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,51200,64,0.05433511071734958
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,16384,16384,0.7943289015028211
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,16384,16384,1.0421661800808377
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,16384,12288,0.7994906637403699
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,16384,10240,0.46645424101087785
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,16384,51200,2.4417173597547746
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,16384,8192,0.41667821672227645
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,16384,10240,0.6380506621466743
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,16384,65536,3.1421288384331594
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,16384,12288,0.6092391014099121
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,16384,8192,0.5185039838155111
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,16384,7168,0.35609955257839626
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,16384,5120,0.21730400456322563
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,16384,7168,0.4352293279435899
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,16384,6144,0.29278932677374947
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,16384,6144,0.3653262191348606
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,16384,4096,0.1750488943523831
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,16384,5120,0.34848801294962567
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,16384,3584,0.16165867116716173
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,16384,3072,0.13339911566840276
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,16384,4096,0.2442915439605713
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,16384,2560,0.11785156197018093
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,16384,3584,0.21572444174024794
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,16384,2048,0.09727111127641465
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,16384,3072,0.1955475542280409
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,16384,1536,0.07527466615041097
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,51200,65536,14.501859876844618
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,16384,2048,0.14050132698482937
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,16384,2560,0.16826044188605416
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,16384,768,0.04530133472548591
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,16384,1536,0.10732266638014053
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,16384,256,0.02426044477356805
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,16384,1024,0.08142933580610487
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,16384,51200,4.021814134385851
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,16384,512,0.05911111169391208
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,16384,64,0.018057778477668762
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,16384,256,0.048694223165512085
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,16384,32,0.01779111060831282
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,16384,128,0.048673778772354126
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,16384,64,0.047037333250045776
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,16384,32,0.04474488894144694
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,16384,65536,4.742013295491536
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,16384,1024,0.051628443929884166
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,16384,512,0.031786666976081
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,16384,768,0.06914489136801825
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,16384,128,0.02029333346419864
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,12288,16384,0.5141608979966905
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,12288,12288,0.4125813378228082
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,12288,10240,0.37180177370707196
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,12288,12288,0.6087830861409506
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,12288,16384,0.8363031281365289
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,12288,8192,0.2902257707383898
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,12288,7168,0.23650312423706055
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,12288,10240,0.5425217946370443
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,12288,8192,0.40387643708123105
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,12288,6144,0.1988124450047811
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,12288,65536,2.524200015597873
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,12288,5120,0.17987110879686144
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,12288,6144,0.3054551018608941
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,12288,7168,0.3706764380137126
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,12288,5120,0.2521759933895535
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,12288,4096,0.15336978435516357
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,12288,3584,0.12620088789198133
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,12288,4096,0.20027466615041098
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,12288,2560,0.09200621975792779
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,12288,3072,0.10161688592698838
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,12288,3584,0.18274845017327201
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,12288,2048,0.07902222209506564
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,12288,1536,0.05691288577185737
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,12288,3072,0.16716178258260092
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,12288,1024,0.04091555542416043
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,12288,2560,0.13391466935475668
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,12288,768,0.03346666693687439
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,12288,2048,0.11139021979437934
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,12288,512,0.024318221542570326
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,12288,1536,0.08915199836095174
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,12288,1024,0.0695528917842441
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,12288,256,0.019582221905390423
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,12288,768,0.054302222198910184
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,12288,128,0.015554666519165039
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,12288,64,0.01351999988158544
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,12288,51200,2.016632080078125
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,12288,512,0.044567998912599355
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,12288,32,0.013411555853154926
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,12288,256,0.0388408899307251
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,12288,64,0.03463644451565213
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,12288,32,0.034309334225124784
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,12288,65536,4.084401024712457
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,10240,16384,0.41539200146993
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,12288,51200,3.073752933078342
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,12288,128,0.0362115568584866
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,10240,12288,0.33795465363396543
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,10240,51200,1.4755058288574219
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,10240,65536,1.8379279242621527
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,10240,10240,0.28609689076741535
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,10240,12288,0.5400702158610026
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,10240,8192,0.24426399336920845
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,10240,10240,0.49910932117038304
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,10240,7168,0.205295999844869
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,10240,16384,0.7631502151489258
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,10240,8192,0.3757528993818495
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,10240,6144,0.17620978090498182
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,10240,5120,0.15175288253360325
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,10240,4096,0.11770844459533691
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,10240,6144,0.2647724416520861
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,10240,7168,0.34499467743767637
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,10240,3584,0.10551644696129693
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,10240,5120,0.2212675544950697
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,10240,4096,0.19120889239841035
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,10240,3072,0.08863555722766453
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,10240,51200,2.610989252726237
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,10240,2560,0.0750017762184143
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,10240,2048,0.06573155853483412
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,10240,3584,0.1583484411239624
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,10240,1536,0.048488888475630015
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,10240,1024,0.03384800089730157
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,10240,3072,0.15245155493418375
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,10240,2560,0.12128178278605144
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,10240,2048,0.10115733411577012
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,10240,1536,0.07999022139443292
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,10240,512,0.028006222512986925
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,10240,256,0.022224000758594934
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,10240,768,0.04989599850442675
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,10240,128,0.013743110828929476
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,10240,512,0.03939111034075419
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,10240,1024,0.059416890144348145
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,10240,64,0.012560000022252401
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,10240,256,0.033597333563698664
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,10240,32,0.012746666868527731
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,10240,128,0.031215998861524794
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,10240,64,0.03094666533999973
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,10240,32,0.030729777283138696
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,10240,65536,3.5147342681884766
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,8192,12288,0.2824195490943061
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,8192,16384,0.6319866710238987
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,10240,768,0.03116977877087063
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,8192,10240,0.24702400631374785
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,8192,51200,1.1625315348307292
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,8192,8192,0.1924142175250583
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,8192,65536,1.4834764268663194
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,8192,10240,0.39514578713311094
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,8192,7168,0.16543644004397923
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,8192,6144,0.15703022480010986
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,8192,8192,0.3619111114078098
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,8192,5120,0.128440883424547
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,8192,16384,0.37263554996914333
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,8192,7168,0.3150257799360487
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,8192,4096,0.10038399696350098
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,8192,6144,0.23457778824700248
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,8192,3584,0.09070399734708999
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,8192,5120,0.20503911707136366
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,8192,3072,0.0785155561235216
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,8192,4096,0.15523466798994276
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,8192,2560,0.06613510847091675
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,8192,3584,0.1429706679450141
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,8192,3072,0.12437600559658474
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,8192,1536,0.041356444358825684
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,8192,2560,0.10662844445970322
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,8192,1024,0.029631111356947158
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,8192,2048,0.08843911356396145
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,8192,768,0.022056000100241765
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,8192,12288,0.5158098008897569
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,8192,512,0.017972444494565327
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,8192,1536,0.07039822472466363
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,8192,1024,0.05158933334880405
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,8192,768,0.04340622160169813
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,8192,128,0.011986666255527072
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,8192,512,0.03420622150103251
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,8192,64,0.01033866653839747
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,8192,256,0.02882844540807936
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,8192,128,0.027448000179396734
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,8192,64,0.027101332942644756
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,8192,32,0.027133334014150832
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,8192,65536,3.0254792107476125
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,8192,2048,0.05169688993030124
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,8192,51200,2.3215067121717667
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,8192,256,0.014293332894643148
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,8192,32,0.010751999914646149
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,7168,16384,0.3234648969438341
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,7168,12288,0.23845511012607148
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,7168,16384,0.5857537587483724
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,7168,10240,0.1998657782872518
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,7168,12288,0.4469617737664117
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,7168,8192,0.1653333372539944
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,7168,7168,0.14548177189297146
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,7168,10240,0.3671297762129042
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,7168,8192,0.295909325281779
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,7168,6144,0.1232080062230428
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,7168,5120,0.10874399873945449
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,7168,7168,0.2711084418826633
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,7168,51200,1.0147519641452365
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,7168,6144,0.21604177686903211
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,7168,4096,0.0828275548087226
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,7168,3584,0.0734835531976488
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,7168,5120,0.1831208864847819
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,7168,3072,0.06337155236138238
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,7168,65536,2.7191280788845487
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,7168,2560,0.054303109645843506
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,7168,4096,0.1428604390886095
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,7168,3584,0.12960978349049887
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,7168,2048,0.04401333464516533
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,7168,1536,0.03382933470937941
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,7168,3072,0.11475377612643772
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,7168,1024,0.023539554741647508
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,7168,2560,0.1023484468460083
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,7168,2048,0.08096444606781006
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,7168,768,0.019080888893869188
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,7168,1536,0.06441244151857164
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,7168,512,0.014857777290874057
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,7168,256,0.011692444483439127
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,7168,1024,0.04816177818510267
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,7168,128,0.010335110955768162
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,7168,768,0.04228711128234863
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,7168,64,0.008963555925422246
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,7168,512,0.03188800149493747
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,7168,32,0.00923999978436364
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,7168,256,0.026586666703224182
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,7168,128,0.025428444147109985
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,7168,64,0.025553777813911438
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,7168,32,0.02531288895342085
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,7168,65536,1.3158551322089302
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,6144,16384,0.27383377816942006
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,7168,51200,2.0320061577690973
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,6144,12288,0.20788889461093477
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,6144,16384,0.5391679869757758
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,6144,10240,0.1803306606080797
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,6144,12288,0.41045334604051376
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,6144,8192,0.14305867089165583
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,6144,51200,0.9238871468438042
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,6144,7168,0.12320444318983291
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,6144,65536,1.1785377926296658
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,6144,10240,0.3422657648722331
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,6144,6144,0.1345368888643053
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,6144,8192,0.2710239887237549
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,6144,5120,0.10619733068678115
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,6144,7168,0.2351920074886746
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,6144,4096,0.09131733576456706
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,6144,3584,0.07877066400316027
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,6144,6144,0.20325777265760633
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,6144,3072,0.07233866718080309
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,6144,5120,0.16560178332858616
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,6144,2560,0.04609244399600559
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,6144,2048,0.03706399930848016
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,6144,3584,0.11849421925014919
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,6144,1536,0.028654221031400893
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,6144,1024,0.020888888173633154
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,6144,3072,0.137119107776218
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,6144,2560,0.11703733603159587
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,6144,768,0.023912888434198167
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,6144,2048,0.07545333438449435
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,6144,512,0.017649778061442904
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,6144,1536,0.058957331710391574
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,6144,256,0.012992888689041138
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,6144,1024,0.044375999106301196
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,6144,128,0.010052444206343757
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,6144,768,0.04977866676118639
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,6144,64,0.008966222405433655
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,6144,512,0.029508444997999404
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,6144,32,0.009143110778596666
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,6144,256,0.024675556355052527
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,6144,128,0.023367111881573994
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,6144,51200,1.9141563839382594
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,6144,64,0.028417779339684382
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,6144,32,0.022974222898483276
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,6144,65536,2.408067491319444
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,5120,16384,0.2817048761579725
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,5120,12288,0.20531822575463188
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,5120,16384,0.4982008934020996
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,6144,4096,0.132877336608039
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,5120,51200,0.7988133430480957
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,5120,8192,0.12702400154537624
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,5120,12288,0.39509601063198513
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,5120,7168,0.11629245016309951
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,5120,65536,1.1434275309244792
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,5120,10240,0.3134702311621772
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,5120,6144,0.11224888430701362
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,5120,7168,0.21860622035132515
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,5120,5120,0.0959742201699151
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,5120,6144,0.18361511495378283
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,5120,4096,0.07798844575881958
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,5120,5120,0.1515680021709866
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,5120,3584,0.06935999790827434
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,5120,3072,0.06063377857208252
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,5120,51200,1.6971466276380751
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,5120,3584,0.10903555817074245
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,5120,2560,0.04121689001719157
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,5120,3072,0.09888622495863174
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,5120,2048,0.03386488887998793
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,5120,1536,0.02716800073782603
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,5120,2560,0.08033066987991333
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,5120,10240,0.1695084439383613
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,5120,1024,0.019733332925372653
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,5120,65536,2.140221277872721
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,5120,2048,0.0693217780854967
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,5120,768,0.01591377788119846
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,5120,512,0.012301333248615265
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,5120,1536,0.05437155564626058
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,5120,256,0.012151999606026543
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,5120,1024,0.04019733270009359
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,5120,128,0.008286221987671321
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,5120,256,0.02300888962215847
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,5120,64,0.007631111476156447
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,5120,8192,0.2677511109246148
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,5120,32,0.007755555212497711
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,5120,128,0.021663111117151048
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,5120,64,0.02162666618824005
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,5120,32,0.02126755482620663
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,5120,4096,0.12184711297353108
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,4096,16384,0.20555733309851754
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,4096,51200,0.5910711288452148
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,4096,65536,0.8356240060594348
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,4096,12288,0.16631555557250977
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,4096,10240,0.13627910614013672
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,5120,512,0.027121777335802715
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,4096,8192,0.1107591125700209
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,4096,16384,0.453363577524821
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,4096,12288,0.35862488216824
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,4096,7168,0.09676622019873725
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,4096,10240,0.286265770594279
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,4096,6144,0.0744204454951816
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,4096,5120,0.064246224032508
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,4096,8192,0.22796355353461373
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,4096,4096,0.05074755681885613
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,4096,7168,0.1978213389714559
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,4096,3584,0.04411377840571933
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,4096,6144,0.20040267043643525
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,4096,3072,0.03779822256830003
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,4096,4096,0.1112168894873725
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,4096,51200,1.5129138098822699
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,4096,3584,0.09888711240556504
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,4096,2048,0.027525333894623652
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,4096,1536,0.022296888960732356
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,4096,3072,0.10323555601967706
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,4096,1024,0.018034666776657104
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,4096,2560,0.07268533441755506
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,4096,2048,0.05962844689687093
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,4096,768,0.014670222997665405
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,4096,512,0.0116462219092581
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,4096,1536,0.04897511005401611
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,4096,256,0.009007111191749573
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,4096,768,0.030993776188956365
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,4096,512,0.0247688889503479
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,4096,128,0.007261333366235097
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,4096,256,0.02075466679202186
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,4096,64,0.006259555617968242
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,5120,768,0.03433600068092346
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,4096,32,0.006615110983451207
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,4096,128,0.01994400057527754
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,4096,64,0.01958044370015462
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,4096,32,0.019501333435376484
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,4096,5120,0.14054755369822183
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,4096,2560,0.03240088952912225
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,3584,65536,0.6245822376675075
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,3584,51200,0.4845884641011556
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,3584,16384,0.1658737791909112
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,3584,12288,0.11938222249348958
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,3584,10240,0.11421688397725423
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,4096,65536,1.9250365363226996
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,3584,8192,0.09289689196480645
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,4096,1024,0.036390221781200834
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,3584,7168,0.07607111003663805
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,3584,12288,0.344942225350274
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,3584,16384,0.4304995536804199
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,3584,6144,0.06748355759514703
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,3584,10240,0.2929768827226427
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,3584,8192,0.2157822185092502
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,3584,4096,0.045928001403808594
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,3584,7168,0.18763289186689588
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,3584,3584,0.039368887742360435
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,3584,6144,0.16302043861813015
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,3584,5120,0.14031110869513616
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,3584,3072,0.033598221010631986
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,3584,4096,0.10536977979871963
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,3584,2560,0.0303422212600708
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,3584,2048,0.025557332568698462
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,3584,3584,0.09400444560580784
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,3584,3072,0.08179644743601482
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,3584,51200,1.4100604587131078
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,3584,1536,0.019367110398080613
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,3584,2560,0.0704924464225769
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,3584,1024,0.014209777116775513
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,3584,768,0.012102222277058495
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,3584,512,0.009305777649084726
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,3584,2048,0.057539555761549205
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,3584,256,0.007599111232492659
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,3584,1024,0.03394844465785556
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,3584,768,0.02923733327123854
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,3584,512,0.023880889018376667
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,3584,256,0.020282665888468426
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,3584,64,0.005943111247486538
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,3584,128,0.018940443793932598
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,3584,64,0.01903022163444095
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,3584,32,0.018587556150224473
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,3584,5120,0.05612711111704508
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,3072,65536,0.5221155484517416
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,3072,51200,0.39586665895250106
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,3072,16384,0.13509155644310847
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,3584,1536,0.046295109722349376
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,3584,128,0.00657155571712388
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,3072,12288,0.10319555468029445
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,3584,32,0.006592888798978593
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,3072,10240,0.08864444494247437
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,3072,8192,0.07167288992140028
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,3072,16384,0.4225768778059218
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,3072,12288,0.3088231086730957
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,3072,7168,0.06707644462585449
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,3072,10240,0.25777777036031085
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,3072,6144,0.059902224275800914
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,3072,8192,0.20560977194044325
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,3072,5120,0.047820445564058095
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,3072,7168,0.17785688241322836
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,3072,4096,0.03838222225507101
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,3072,3584,0.036074668169021606
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,3072,6144,0.1502257717980279
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,3072,65536,1.6977163950602214
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,3072,5120,0.12452622254689534
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,3072,3072,0.028781334559122723
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,3072,4096,0.10019999742507935
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,3072,2560,0.02519911030928294
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,3072,2048,0.021470222208235
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,3072,51200,1.346475601196289
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,3072,3584,0.09048799673716228
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,3072,1536,0.01771377854877048
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,3072,1024,0.013239111337396832
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,3072,3072,0.0773528880543179
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,3072,2560,0.06726044416427612
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,3072,768,0.011412444214026133
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,3072,2048,0.05444622370931837
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,3072,512,0.009888889061080085
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,3584,65536,1.7963085174560547
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,3072,1024,0.03241599930657281
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,3072,256,0.007310222420427535
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,3072,768,0.028001778655582007
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,3072,512,0.022631110416518316
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,3072,32,0.005562666803598404
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,3072,256,0.018766222728623282
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,3072,128,0.017864889568752713
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,3072,64,0.017864889568752713
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,3072,32,0.017521777086787753
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,2560,51200,0.37176354726155597
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,2560,16384,0.13134311305152044
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,2560,12288,0.09518133269415961
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,2560,16384,0.4058409002092149
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,3072,1536,0.043154666821161904
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,3072,128,0.005935110979610019
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,2560,8192,0.0709644423590766
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,2560,10240,0.24369422594706217
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,2560,7168,0.06074844466315376
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,2560,8192,0.1936968829896715
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,2560,65536,1.5877360237969294
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,2560,6144,0.05266844564014011
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,2560,65536,0.4827813572353787
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,2560,5120,0.04344444473584493
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,2560,7168,0.16873955726623535
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,2560,4096,0.03507288959291246
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,2560,6144,0.14140978124406603
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,2560,3584,0.0313991109530131
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,2560,3072,0.027306665976842243
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,2560,5120,0.11719555324978298
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,2560,4096,0.09438221984439427
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,2560,3584,0.0846337808503045
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,2560,3072,0.07436444362004598
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,2560,2048,0.020628444022602506
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,2560,1536,0.016688000824716356
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,2560,12288,0.29047377904256183
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,2560,2560,0.06345244248708089
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,2560,1024,0.012434666355450949
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,3072,64,0.0052720002002186244
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,2560,10240,0.09029066562652588
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,2560,768,0.010378667049937779
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,2560,512,0.008294222255547842
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,2560,2048,0.05133600036303202
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,2560,1536,0.04009955459170871
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,2560,1024,0.030894223186704848
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,2560,768,0.026434666580624048
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,2560,512,0.02147377696302202
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,2560,128,0.005559999909665849
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,2560,256,0.018223111828168232
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,2560,51200,1.230804443359375
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,2560,64,0.0052533331844541765
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,2560,32,0.005583999885453119
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,2560,128,0.017056889004177518
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,2560,64,0.016806221670574613
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,2560,32,0.016502221425374348
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,2048,16384,0.1093475553724501
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,2048,65536,0.38468000623914933
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,2048,51200,0.31431910726759166
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,2048,12288,0.08976978063583374
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,2048,10240,0.06241333484649658
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,2560,2560,0.02459022237194909
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,2048,8192,0.057887997892167836
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,2048,16384,0.3623333242204454
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,2048,12288,0.27357154422336155
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,2048,7168,0.044728888405693897
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,2048,6144,0.03741155399216546
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,2048,10240,0.24529777632819283
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,2560,256,0.006533333410819371
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,2048,7168,0.16165333324008518
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,2048,4096,0.026911111341582403
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,2048,51200,1.1223253673977323
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,2048,5120,0.11043555868996514
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,2048,3584,0.02404622236887614
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,2048,3072,0.021294222937689886
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,2048,4096,0.09269955423143174
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,2048,65536,1.4258382585313585
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,2048,2560,0.018848000301255118
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,2048,2048,0.016536888149049547
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,2048,3072,0.0691573354932997
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,2048,1536,0.012757333616415659
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,2048,2560,0.05897421969307793
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,2048,2048,0.04853066802024841
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,2048,1024,0.010142222046852112
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,2048,768,0.008657777474986183
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,2048,1536,0.037680887513690524
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,2048,512,0.007286222444640265
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,2048,1024,0.02882400155067444
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,2048,256,0.005892444401979446
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,2048,512,0.020131554868486192
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,2048,128,0.005250666704442766
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,2048,256,0.016873778568373788
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,2048,64,0.004612444589535396
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,2048,8192,0.18285155296325684
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,2048,32,0.0052266667286554975
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,2048,128,0.01614755557643043
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,2048,6144,0.13378489017486572
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,2048,64,0.01550222271018558
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,2048,32,0.015476443701320224
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,1536,65536,0.31636889775594074
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,2048,3584,0.08006044228871663
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,1536,16384,0.08076710833443536
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,1536,12288,0.060184889369540744
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,1536,16384,0.3390791151258681
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,2048,768,0.02474222249454922
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,1536,12288,0.26680265532599556
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,1536,8192,0.03968977928161621
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,1536,7168,0.03481244378619724
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,2048,5120,0.03417422374089559
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,1536,10240,0.21524977684020996
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,1536,51200,1.040769788953993
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,1536,6144,0.032820443312327065
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,1536,5120,0.028174221515655518
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,1536,4096,0.023108444280094568
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,1536,65536,1.3285129335191515
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,1536,6144,0.12458488676283096
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,1536,3584,0.02016799979739719
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,1536,5120,0.10315822230445014
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,1536,3072,0.01834133267402649
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,1536,51200,0.2368675602806939
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,1536,4096,0.08375910917917888
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,1536,3584,0.07448977894253202
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,1536,2048,0.013539555172125498
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,1536,1536,0.011123555401961008
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,1536,3072,0.06464622418085735
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,1536,1024,0.008958222137557136
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,1536,2560,0.05476444297366672
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,1536,768,0.00793333351612091
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,1536,2048,0.045046223534478076
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,1536,1536,0.035383111900753446
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,1536,512,0.00628355559375551
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,1536,1024,0.027419555518362258
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,1536,256,0.0052151112920708126
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,1536,768,0.023494222097926672
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,1536,10240,0.04998222324583265
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,1536,128,0.004524444540341695
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,1536,512,0.01906133360332913
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,1536,64,0.0042035554846127825
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,1536,256,0.016197333733240765
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,1536,32,0.004565333326657613
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,1536,128,0.015182221929232279
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,1536,64,0.01512977812025282
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,1536,32,0.01455200049612257
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,1024,65536,0.2244675424363878
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,1024,51200,0.1720071103837755
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,1536,7168,0.14725600348578557
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,1024,12288,0.0432240002685123
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,1536,2560,0.016128889388508268
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,1024,10240,0.03990222348107232
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,1024,12288,0.23970754941304526
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,1024,8192,0.028751999139785767
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,1024,10240,0.20127288500467935
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,1024,51200,0.963814205593533
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,1024,7168,0.026268444127506677
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,1024,8192,0.16024443838331434
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,1024,6144,0.022738666998015508
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,1024,5120,0.019706666469573975
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,1024,65536,1.2301342222425673
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,1024,4096,0.016150222884284127
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,1024,7168,0.1378977828555637
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,1024,6144,0.11627644962734646
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,1024,3584,0.014168888330459595
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,1024,5120,0.09566844171947902
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,1024,16384,0.05594755543602837
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,1536,8192,0.17508355776468912
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,1024,2560,0.011403555671374003
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,1024,4096,0.07760444614622328
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,1024,2048,0.009767110976907942
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,1024,1536,0.007995555798212687
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,1024,3584,0.06934044758478801
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,1024,3072,0.060046222474839955
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,1024,2560,0.0502053333653344
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,1024,1024,0.006919999917348226
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,1024,768,0.005952000204059813
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,1024,512,0.00519822206762102
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,1024,1536,0.03271199928389655
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,1024,16384,0.31700889269510907
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,1024,1024,0.02534666657447815
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,1024,256,0.0041911109454101985
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,1024,768,0.021959111094474792
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,1024,128,0.0038399998512532976
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,1024,64,0.003834666477309333
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,1024,512,0.017996443642510306
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,1024,32,0.0038737778862317405
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,1024,128,0.014109333356221518
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,1024,256,0.015159999330838522
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,1024,64,0.013806222213639153
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,1024,32,0.013739555246300168
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,768,65536,0.16936088932885063
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,768,51200,0.13511733214060465
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,768,16384,0.04297511114014519
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,768,12288,0.03641066617435879
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,768,10240,0.029667556285858154
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,768,16384,0.305456002553304
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,768,8192,0.021838222940762837
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,768,10240,0.1940577824910482
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,1024,3072,0.012495111260149213
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,768,7168,0.019877332780096266
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,768,6144,0.017305778132544625
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,768,8192,0.15450667010413274
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,1024,2048,0.04123377799987793
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,768,5120,0.015632000234391954
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,768,6144,0.1117395559946696
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,768,51200,0.9313457277086047
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,768,3584,0.01204533295498954
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,768,5120,0.09170844157536824
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,768,65536,1.1870862113104927
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,768,3072,0.011057777537239922
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,768,2560,0.009909333454238044
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,768,3584,0.06618222263124254
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,768,2048,0.008341333104504479
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,768,3072,0.05750222338570488
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,768,2560,0.0482666658030616
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,768,1536,0.007265778051482306
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,768,1024,0.006280000011126201
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,768,768,0.005321777943107817
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,768,1024,0.024453333682484094
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,768,12288,0.23183290163675943
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,768,512,0.004872000051869286
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,768,256,0.0038568890757030914
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,768,768,0.02130844526820713
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,768,512,0.01756622228357527
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,768,128,0.003843555433882607
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,768,64,0.0035084444615576
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,768,256,0.014517333772447375
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,768,32,0.0038417776425679526
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,768,128,0.013457777599493662
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,768,7168,0.13337688975863987
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,768,64,0.01311644415060679
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,768,4096,0.013356444736321768
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,768,32,0.013078221844302284
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,512,65536,0.13682488600413004
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,512,51200,0.1051279968685574
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,512,16384,0.035840001371171736
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,512,12288,0.025736000802781846
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,768,4096,0.07443200217352973
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,512,10240,0.021879111727078755
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,512,8192,0.017998221847746108
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,512,16384,0.2949724462297228
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,512,12288,0.22343201107449004
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,512,7168,0.016185777054892648
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,512,8192,0.149000883102417
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,512,6144,0.01464355488618215
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,512,5120,0.012439111040698158
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,768,1536,0.031558222240871854
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,512,7168,0.12891022364298502
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,512,4096,0.011314666933483548
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,512,6144,0.10752622286478679
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,512,5120,0.08822933170530532
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,512,3584,0.009537777966923183
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,512,51200,0.8949271308051215
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,512,3072,0.008655110994974772
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,512,2560,0.00794666674402025
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,512,4096,0.07136444250742595
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,512,3584,0.06383377975887723
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,512,2048,0.0069857777820693115
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,512,65536,1.1401946809556749
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,512,1536,0.005952888892756567
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,512,3072,0.05484266744719612
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,512,1024,0.004918222212129169
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,512,768,0.00453599997692638
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,512,2048,0.03761333227157593
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,512,1536,0.030264000097910564
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,512,1024,0.0236799998415841
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,512,768,0.020358221398459542
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,512,512,0.016879111528396606
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,512,128,0.0032239999208185407
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,512,256,0.013798221945762634
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,512,64,0.0031831111345026228
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,512,10240,0.18697955873277453
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,512,128,0.013193777865833707
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,768,2048,0.03889688849449158
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,512,32,0.003160888950030009
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,512,64,0.012740444805887012
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,256,65536,0.07589955462349786
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,256,51200,0.06087733639611138
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,512,32,0.012737777498033313
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,256,16384,0.02130577796035343
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,256,12288,0.018579555882347953
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,256,16384,0.2835422092013889
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,256,12288,0.21496444278293184
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,256,10240,0.016347555650605094
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,512,2560,0.045498665836122304
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,256,8192,0.013579555683665805
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,256,7168,0.012434666355450949
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,512,512,0.0042133331298828125
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,256,6144,0.01111288865407308
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,512,256,0.003547555456558863
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,256,10240,0.18008444044325086
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,256,8192,0.14369244045681423
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,256,5120,0.009678222239017487
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,256,7168,0.1234275499979655
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,256,3584,0.007840889195601145
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,256,51200,0.8585404290093316
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,256,3072,0.0070222218831380205
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,256,5120,0.08470133278104995
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,256,4096,0.06893955336676703
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,256,65536,1.0936871634589302
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,256,2560,0.006292444550328785
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,256,3584,0.06123555368847317
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,256,1536,0.0052062223354975385
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,256,3072,0.05183022220929464
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,256,1024,0.0041911109454101985
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,256,2048,0.03656977746221755
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,256,768,0.004011555678314633
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,256,1536,0.0292559994591607
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,256,512,0.0035235554807715942
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,256,1024,0.022661333282788593
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,256,256,0.0035004446076022256
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,256,768,0.0199608885579639
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,256,128,0.0031715554909573663
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,256,512,0.01648622254530589
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,256,64,0.002862222285734283
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,256,256,0.013412444127930535
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,256,32,0.0031804444475306403
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,256,128,0.012730666332774691
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,256,64,0.012401777837011548
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,128,65536,0.0584133333630032
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,256,32,0.012105777859687805
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,128,51200,0.04834666517045763
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,128,16384,0.014761777387724983
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,256,4096,0.008352888955010308
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,128,12288,0.014152000347773233
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,256,6144,0.10350133313073052
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,128,10240,0.012503999802801343
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,128,8192,0.01275466630856196
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,256,2048,0.005579555614127054
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,128,16384,0.28291556570265025
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,128,7168,0.011583111352390714
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,128,6144,0.010382222632567087
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,256,2560,0.04384088847372267
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,128,10240,0.18016089333428276
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,128,5120,0.008982222113344405
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,128,8192,0.14256532986958823
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,128,4096,0.00796888851457172
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,128,3584,0.0074142225914531285
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,128,6144,0.10286666949590047
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,128,5120,0.0837564468383789
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,128,3072,0.006616000086069107
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,128,51200,0.8568159739176432
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,128,4096,0.0682248870531718
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,128,2560,0.0058959999846087555
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,128,3584,0.06075555748409695
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,128,2048,0.0052488889131281115
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,128,1536,0.0048942222363419
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,128,65536,1.0936844083997939
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,128,3072,0.051161779297722705
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,128,2560,0.04258044560750326
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,128,1024,0.004184000194072723
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,128,1536,0.02918222215440538
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,128,768,0.0038328886859946777
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,128,512,0.0034933334423436057
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,128,1024,0.022647110952271357
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,128,768,0.0196106665664249
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,128,512,0.015835555063353646
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,128,128,0.002867555452717675
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,128,64,0.002833777831660377
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,128,256,0.013074666261672974
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,128,32,0.0028195555011431375
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,128,128,0.012050666742854647
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,128,64,0.012111110819710625
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,64,65536,0.05606310897403293
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,128,32,0.011731555892361535
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,64,51200,0.04576799935764737
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,128,12288,0.21422221925523546
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,64,16384,0.012621333201726278
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,64,12288,0.013251555462678274
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,128,7168,0.12332622210184734
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,64,10240,0.011712888876597086
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,64,16384,0.28257155418395996
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,64,12288,0.21403022607167563
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,64,8192,0.01038755559258991
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,64,7168,0.009769777456919352
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,64,10240,0.17951022254096138
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,128,2048,0.035135110219319664
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,64,6144,0.008957333034939235
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,64,5120,0.009318222602208456
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,128,256,0.003232888877391815
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,64,7168,0.12247999509175618
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,64,4096,0.00794933322403166
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,64,51200,0.8561866548326281
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,64,3584,0.007168889045715332
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,64,6144,0.10302666823069255
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,64,3072,0.006591111007663939
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,64,2560,0.00628266649113761
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,64,5120,0.08387644423378839
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,64,65536,1.0933947033352323
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,64,4096,0.06825511323081122
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,64,2048,0.0052764444715446895
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,64,3584,0.06042044692569309
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,64,3072,0.0513573322031233
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,64,1024,0.003953777667548922
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,64,2560,0.042436444097095065
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,64,768,0.003842666745185852
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,64,2048,0.03572355707486471
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,64,1536,0.028777778148651123
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,64,512,0.0035146665241983202
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,64,256,0.0031973332580592898
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,64,1024,0.022658665974934895
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,64,128,0.0028737777223189673
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,64,64,0.0028159999185138275
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,64,768,0.019721777902709115
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,64,512,0.01614755557643043
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,64,32,0.00258933338854048
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,64,128,0.012099555797047086
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,32,65536,0.05018044511477152
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,64,64,0.011705777711338468
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,32,51200,0.04200889004601372
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,64,32,0.011776888536082374
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,32,16384,0.011341333389282227
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,32,12288,0.009701333112186855
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,32,16384,0.2831439971923828
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,64,8192,0.14268267154693604
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,32,10240,0.00904088881280687
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,32,12288,0.21448266506195068
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,32,8192,0.007962666451931
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,32,7168,0.00795911086930169
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,32,10240,0.1796497768825955
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,32,8192,0.14254932933383518
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,64,1536,0.004569777597983678
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,32,6144,0.010675555302037133
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,32,7168,0.12269777721828884
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,32,5120,0.018191999859280057
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,32,4096,0.008734222087595198
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,32,3584,0.008299555215570662
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,32,6144,0.1024728880988227
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,32,5120,0.08433422115113999
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,32,4096,0.06828977664311726
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,32,65536,1.0928115844726562
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,64,256,0.012799111505349478
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,32,2560,0.010680889089902243
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,32,3584,0.06043733490837944
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,32,2048,0.005208888815508948
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,32,1536,0.004580444345871608
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,32,1024,0.004217777815130022
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,32,3072,0.051009777519438
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,32,2560,0.0439991123146481
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,32,2048,0.03496711121665107
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,32,768,0.00387999994887246
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,32,1536,0.028756442997190688
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,32,512,0.0033760000434186724
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,32,128,0.0028328889360030494
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,32,1024,0.02258577777279748
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,32,768,0.019606222709019978
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,32,64,0.0028151110228565005
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,32,512,0.01605422298113505
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,32,256,0.012734221915404001
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,32,32,0.0028275555620590844
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,32,128,0.012085333466529846
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,32,64,0.011788444386588203
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,32,32,0.011724444727102915
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2305,32,51200,0.8567315737406412
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,32,3072,0.007603555917739868
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2305,32,256,0.0031635556370019913
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,65536,16384,2.7819129096137156
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,65536,12288,2.2353697882758246
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,65536,16384,3.4458594852023654
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,65536,16384,3.015730751885308
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,65536,12288,2.4449217054578996
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,65536,10240,1.9677342308892145
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,65536,10240,2.0121021270751953
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,65536,12288,2.2841805352105036
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,65536,8192,1.5852720472547743
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,65536,8192,1.557453367445204
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,65536,7168,1.4340978198581273
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,65536,51200,8.770679897732204
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,65536,10240,1.931728786892361
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,65536,7168,1.3629822201199
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,65536,8192,1.5603546566433375
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,65536,5120,0.7811679840087891
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,65536,7168,1.3609324561225042
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,65536,6144,1.279495981004503
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,65536,5120,0.9856693479749891
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,65536,6144,1.1832799911499023
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,65536,4096,0.667269335852729
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,65536,6144,1.09862306382921
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,65536,4096,0.9797671635945638
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,65536,3584,0.5674657821655273
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,65536,5120,0.9298142327202691
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,65536,3584,0.69504091474745
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,65536,4096,0.7486044565836588
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,65536,3072,0.47681331634521484
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,65536,2560,0.39325867758856875
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,65536,3072,0.6192951202392578
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,65536,3584,0.6636835734049479
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,65536,2560,0.570558230082194
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,65536,2048,0.33033156394958496
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,65536,3072,0.5676328870985243
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,65536,2048,0.40628888871934676
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,65536,1536,0.2612035539415148
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,65536,2560,0.4947839842902289
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,65536,1024,0.16614933808644614
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,65536,2048,0.4061617851257324
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,65536,1536,0.34847111172146267
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,65536,768,0.13883999983469644
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,65536,1024,0.2916773425208198
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,65536,1024,0.24825689527723524
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,65536,512,0.10707110828823513
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,65536,768,0.19470400280422637
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,65536,256,0.08784621953964233
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,65536,768,0.20054845015207926
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,65536,512,0.17585155698988172
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,65536,512,0.16233689255184597
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,65536,128,0.06412977642483182
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,65536,64,0.05881333351135254
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,65536,256,0.1330382161670261
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,65536,128,0.10095200273725723
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,65536,32,0.060805333985222705
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,65536,128,0.1403528849283854
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,65536,64,0.13938400480482313
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,65536,51200,13.832410176595053
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,65536,1536,0.31898755497402614
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,65536,256,0.14578755696614584
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,65536,32,0.14038756158616808
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,65536,51200,10.221328735351562
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,51200,16384,2.3294239044189453
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,51200,16384,2.7986471388075085
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,51200,51200,6.93305163913303
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,51200,12288,1.7010924021402996
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,51200,16384,2.492200003729926
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,51200,65536,8.772030300564236
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,51200,10240,1.480031967163086
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,51200,12288,1.9424097273084853
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,51200,12288,1.8527937995062933
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,51200,8192,1.1141466564602323
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,51200,10240,1.6303964191012914
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,51200,51200,10.869368659125435
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,51200,7168,0.8924160003662109
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,51200,8192,1.2573892805311415
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,51200,10240,1.5405404832628038
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,51200,7168,1.0939689212375217
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,51200,6144,0.8027057647705078
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,51200,8192,1.2030533684624565
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,51200,6144,0.9950728946261935
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,51200,5120,0.6877724329630533
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,51200,51200,8.210946824815538
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,51200,7168,0.9970444573296441
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,51200,5120,0.7963253127204047
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,51200,65536,14.038768344455294
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,51200,6144,0.8619022369384766
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,51200,4096,0.5513182216220432
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,51200,5120,0.7380773226420084
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,51200,3584,0.45759020911322695
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,51200,4096,0.647799121008979
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,51200,3072,0.4260248872968886
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,51200,3584,0.5737422307332357
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,51200,4096,0.5954666667514378
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,51200,2560,0.3369591236114502
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,51200,3072,0.4785528712802463
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,51200,2560,0.4073822233412001
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,51200,3584,0.5225253105163574
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,51200,3072,0.4699733522203233
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,51200,2560,0.39400000042385525
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,51200,1536,0.21207822693718803
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,51200,2048,0.32630756166246205
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,51200,1024,0.1568791071573893
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,51200,1536,0.26495644781324595
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,51200,2048,0.32432177331712514
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,51200,1024,0.1944542196061876
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,51200,768,0.11817422178056504
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,51200,1536,0.26327912012736004
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,51200,512,0.08547733227411906
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,51200,768,0.1572222179836697
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,51200,65536,10.451850043402777
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,51200,1024,0.25164710150824654
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,51200,768,0.16243378321329752
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,51200,512,0.13285422325134277
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,51200,512,0.13666310575273302
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,51200,256,0.062231997648874916
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,51200,256,0.11010666688283284
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,51200,128,0.11094399955537583
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,51200,128,0.08486488792631362
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,51200,256,0.14562133948008218
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,51200,2048,0.28327645195855033
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,51200,32,0.04610666632652283
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,51200,64,0.11630933814578587
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,51200,32,0.1137662198808458
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,51200,128,0.05181866553094652
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,51200,64,0.044962667756610446
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,16384,16384,0.6833484437730578
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,16384,51200,2.166852527194553
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,16384,16384,1.0235502454969618
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,16384,65536,2.7555991278754344
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,16384,12288,0.5144053565131294
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,16384,10240,0.4083075523376465
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,16384,12288,0.7445031272040473
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,16384,12288,0.7681999736362033
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,16384,51200,3.887535942925347
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,16384,10240,0.6655893325805664
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,16384,8192,0.35030044449700254
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,16384,10240,0.6338986820644802
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,16384,8192,0.5120364295111762
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,16384,7168,0.3273386690351698
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,16384,65536,4.781909518771701
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,16384,8192,0.5093155437045628
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,16384,6144,0.29973867204454213
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,16384,7168,0.4265040026770697
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,16384,5120,0.2557244565751818
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,16384,6144,0.38002933396233457
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,16384,7168,0.4476017951965332
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,16384,5120,0.300784879260593
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,16384,6144,0.38240355915493435
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,16384,4096,0.16204355822669134
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,16384,51200,3.3288186391194663
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,16384,4096,0.2392657862769233
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,16384,3584,0.14859733316633436
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,16384,3072,0.13421421580844456
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,16384,5120,0.35748712221781415
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,16384,4096,0.26310756471421987
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,16384,65536,4.202787611219618
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,16384,3072,0.18587022357516816
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,16384,2560,0.11650221877627903
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,16384,3584,0.2452275488111708
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,16384,3072,0.2060906622144911
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,16384,2560,0.1587644418080648
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,16384,1536,0.07044621970918444
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,16384,2048,0.13376800219217935
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,16384,2048,0.15262311034732395
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,16384,1024,0.04782399866316053
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,16384,1536,0.10487377643585205
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,16384,1024,0.08029244343439738
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,16384,768,0.0388684438334571
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,16384,768,0.07902755339940389
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,16384,768,0.06584178076850043
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,16384,512,0.029881778690550063
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,16384,512,0.05476088987456428
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,16384,512,0.06581066714392768
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,16384,256,0.021747555997636583
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,16384,3584,0.21323733859592012
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,16384,128,0.019353777170181274
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,16384,256,0.04770933257208931
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,16384,16384,1.018602689107259
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,16384,64,0.016372443901167977
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,16384,128,0.04482311010360718
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,16384,128,0.04366311099794176
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,16384,32,0.016185777054892648
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,16384,2560,0.18647378020816377
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,16384,64,0.04440800017780728
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,16384,32,0.045040001471837364
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,16384,1536,0.12162755595313178
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,16384,1024,0.09383910894393921
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,16384,256,0.05287377701865303
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,16384,2048,0.0812551114294264
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,12288,16384,0.5465315712822808
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,12288,51200,1.6237786610921223
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,12288,65536,2.0750925276014542
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,12288,16384,0.8169271151224772
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,12288,12288,0.3944426642523871
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,12288,12288,0.6032480133904351
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,12288,16384,0.8682008849249946
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,12288,10240,0.3049937884012858
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,12288,51200,3.084276411268446
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,12288,12288,0.6632195578681098
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,12288,10240,0.5060817930433485
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,12288,8192,0.27030666669209796
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,12288,7168,0.2313466601901584
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,12288,8192,0.4025262196858724
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,12288,10240,0.5477369096544054
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,12288,65536,4.074949476453993
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,12288,51200,2.7153875562879772
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,12288,8192,0.4350488980611165
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,12288,6144,0.17840354972415498
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,12288,5120,0.1735466718673706
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,12288,7168,0.3735475540161133
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,12288,6144,0.29574934641520184
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,12288,7168,0.380129787656996
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,12288,5120,0.24721511205037436
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,12288,6144,0.34036978085835773
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,12288,5120,0.27476000785827637
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,12288,4096,0.20349155531989205
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,12288,3584,0.12495377328660752
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,12288,4096,0.1376711130142212
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,12288,4096,0.22381244765387642
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,12288,3072,0.09501422113842434
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,12288,3584,0.17467466990152994
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,12288,65536,3.5464488135443797
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,12288,2560,0.08478666676415338
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,12288,3584,0.2025031116273668
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,12288,2048,0.06813777817620172
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,12288,3072,0.15372710757785374
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,12288,3072,0.1767653359307183
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,12288,1536,0.05473955472310384
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,12288,2560,0.1310675541559855
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,12288,1024,0.03904622130923801
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,12288,2560,0.15273688899146184
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,12288,2048,0.14164266321394178
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,12288,768,0.03074399961365594
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,12288,2048,0.11397155125935872
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,12288,1536,0.08707022004657322
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,12288,1536,0.10585066345002915
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,12288,512,0.02273599969016181
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,12288,1024,0.06708533234066434
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,12288,256,0.017465778523021273
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,12288,768,0.05385066734419929
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,12288,512,0.05753066804673937
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,12288,512,0.045555555158191256
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,12288,256,0.046238223711649575
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,12288,256,0.0373946660094791
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,12288,64,0.013739555246300168
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,12288,32,0.013001778059535556
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,12288,128,0.0348639984925588
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,12288,128,0.03837600019243028
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,12288,64,0.0343831115298801
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,12288,32,0.033943110042148165
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,12288,1024,0.081185777982076
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,12288,128,0.015499555402331881
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,10240,51200,1.5058097839355469
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,10240,16384,0.47936444812350804
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,10240,65536,1.8623538547092016
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,10240,12288,0.3790915542178684
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,12288,768,0.07203288873036702
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,10240,16384,0.7565724584791395
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,10240,16384,0.7877013418409559
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,10240,10240,0.3006533251868354
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,10240,51200,2.704313702053494
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,10240,12288,0.6040879885355631
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,10240,8192,0.23318399323357475
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,10240,12288,0.5875386661953396
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,10240,10240,0.44640265570746523
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,10240,65536,3.218639161851671
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,10240,8192,0.36157067616780597
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,10240,7168,0.20360622141096327
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,10240,10240,0.5323404206169976
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,10240,6144,0.17211466365390352
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,10240,7168,0.3084648980034722
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,10240,8192,0.425839106241862
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,10240,5120,0.14207377698686388
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,10240,6144,0.26365688112046987
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,10240,7168,0.3491991096072727
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,10240,4096,0.11212266816033258
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,10240,5120,0.2168062263064914
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,10240,6144,0.2999955548180474
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,10240,3584,0.09778310855229695
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,10240,4096,0.1795599990420871
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,10240,4096,0.20704710483551025
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,10240,3072,0.08561955557929145
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,10240,65536,3.137963612874349
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,10240,3584,0.15511377652486166
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,10240,2560,0.07287466526031494
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,10240,3584,0.18391199906667074
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,10240,51200,2.511040793524848
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,10240,3072,0.13722044891781277
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,10240,2048,0.057757331265343555
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,10240,3072,0.16227111551496717
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,10240,1536,0.042774223619037204
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,10240,2560,0.1195031139585707
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,10240,2560,0.13997688558366564
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,10240,2048,0.09771111276414658
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,10240,1024,0.0307279990779029
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,10240,1536,0.09707822402318318
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,10240,768,0.023303111394246418
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,10240,1024,0.058443552917904325
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,10240,1024,0.07512266768349542
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,10240,512,0.018087999688254464
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,10240,768,0.04772266745567322
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,10240,768,0.06515110863579644
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,10240,256,0.014488889111412896
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,10240,512,0.038556443320380315
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,10240,512,0.05358666512701246
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,10240,128,0.011962666279739805
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,10240,256,0.04337333308325874
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,10240,64,0.01108266661564509
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,10240,128,0.03495555453830295
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,10240,32,0.0114702218108707
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,10240,64,0.03052177694108751
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,10240,5120,0.25343288315667045
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,10240,32,0.030128889613681372
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,10240,2048,0.1264115571975708
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,10240,1536,0.08150311311086018
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,10240,256,0.03268977668550279
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,10240,128,0.031207111146714952
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,8192,65536,1.361636479695638
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,8192,51200,0.9733493593004016
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,8192,16384,0.35713866021898055
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,8192,12288,0.26937511232164174
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,8192,16384,0.6565741962856716
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,8192,12288,0.501180436876085
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,8192,16384,0.7267448637220594
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,8192,10240,0.22860977384779188
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,8192,51200,2.3098701900906033
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,8192,12288,0.5341395801968044
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,8192,65536,2.926558176676432
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,8192,10240,0.3924240006340875
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,8192,7168,0.16984444194369844
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,8192,8192,0.32177689340379506
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,8192,10240,0.4484773212009006
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,8192,6144,0.13202044698927137
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,8192,8192,0.3611733383602566
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,8192,7168,0.2701306607988146
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,8192,5120,0.11630577511257595
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,8192,7168,0.32603467835320366
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,8192,6144,0.2289022339714898
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,8192,65536,2.7883680131700306
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,8192,4096,0.09245600303014119
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,8192,5120,0.18956622812483045
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,8192,51200,2.180771509806315
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,8192,3584,0.08398133516311646
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,8192,4096,0.15256178379058838
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,8192,3072,0.07247733407550387
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,8192,4096,0.1874533361858792
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,8192,3584,0.13643022378285727
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,8192,3584,0.16957244608137342
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,8192,8192,0.186191995938619
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,8192,2560,0.059430221716562905
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,8192,3072,0.12019466029273139
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,8192,2048,0.045797334776984326
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,8192,3072,0.1577377716700236
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,8192,1536,0.035327110025617815
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,8192,2560,0.1283244424396091
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,8192,2048,0.08635733524958293
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,8192,2048,0.10810933510462443
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,8192,1536,0.07015199793709649
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,8192,1536,0.08817333645290798
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,8192,768,0.020488889680968392
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,8192,1024,0.06872800323698255
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,8192,1024,0.050620443291134305
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,8192,512,0.0155404441886478
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,8192,768,0.042400889926486544
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,8192,256,0.012084444363911947
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,8192,768,0.059193776713477246
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,8192,512,0.03332533439000448
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,8192,512,0.049011554982927114
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,8192,128,0.01055466632048289
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,8192,256,0.028600888119803533
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,8192,256,0.04060533311631944
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,8192,64,0.009109333157539368
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,8192,6144,0.2718577649858263
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,8192,32,0.009339555270142024
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,8192,128,0.027079110344250996
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,8192,64,0.02717511190308465
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,8192,5120,0.22732533348931205
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,8192,32,0.02644888891114129
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,8192,2560,0.10332000255584717
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,8192,1024,0.02552266584502326
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,7168,16384,0.36053066783481175
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,7168,51200,0.9802684783935547
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,8192,128,0.031204445494545832
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,7168,65536,1.357192039489746
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,7168,12288,0.2748737865024143
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,7168,16384,0.6100542280409071
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,7168,12288,0.4635173479715983
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,7168,10240,0.23066933949788412
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,7168,16384,0.6769804424709744
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,7168,51200,2.079111099243164
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,7168,8192,0.17529688941107857
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,7168,12288,0.5888151062859429
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,7168,10240,0.374159124162462
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,7168,7168,0.16339555051591662
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,7168,65536,2.578148523966471
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,7168,8192,0.2961306571960449
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,7168,8192,0.3462071153852675
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,7168,6144,0.12779200077056885
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,7168,7168,0.26178932189941406
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,7168,7168,0.30371199713812935
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,7168,5120,0.11067910989125569
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,7168,6144,0.2140871153937446
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,7168,51200,2.061902152167426
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,7168,6144,0.2560337649451362
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,7168,4096,0.08720711204740737
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,7168,5120,0.17866933345794678
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,7168,5120,0.21708888477749297
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,7168,3584,0.07987466785642836
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,7168,65536,2.626765357123481
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,7168,3072,0.06940711206860013
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,7168,4096,0.14276977380116782
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,7168,4096,0.17640533712175158
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,7168,2560,0.05428533421622383
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,7168,3584,0.12627732753753662
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,7168,3584,0.16087555885314941
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,7168,2048,0.04583200150065952
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,7168,3072,0.13937600453694662
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,7168,3072,0.11505956119961208
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,7168,2560,0.09670755598280166
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,7168,10240,0.4376186794704861
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,7168,2560,0.12160800562964545
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,7168,1024,0.02307555576165517
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,7168,2048,0.08018666505813599
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,7168,2048,0.10320622391170925
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,7168,768,0.020454222957293194
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,7168,1536,0.08403555552164714
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,7168,1536,0.06366222434573703
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,7168,1024,0.04714311162630717
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,7168,1024,0.06566933128568861
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,7168,256,0.013079110946920184
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,7168,768,0.05613778034845988
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,7168,768,0.03918044434653388
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,7168,512,0.03150666753451029
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,7168,128,0.01039644413524204
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,7168,256,0.02644266684850057
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,7168,64,0.00924622184700436
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,7168,128,0.031168888012568157
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,7168,128,0.025016888976097107
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,7168,32,0.009554666777451834
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,7168,64,0.024749333659807842
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,7168,32,0.02443555494149526
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,7168,1536,0.0362755556901296
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,7168,512,0.01663377715481652
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,6144,65536,1.0564417309231229
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,7168,512,0.04702044526735941
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,7168,256,0.03904177745183309
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,6144,16384,0.27969156371222603
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,6144,51200,0.9064071443345812
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,6144,12288,0.20099022653367785
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,6144,16384,0.5335013071695963
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,6144,10240,0.17373422781626383
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,6144,12288,0.5322355694240993
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,6144,16384,0.6341973410712348
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,6144,12288,0.4777688980102539
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,6144,10240,0.33512088987562394
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,6144,8192,0.14576000637478298
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,6144,7168,0.1289751132329305
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,6144,65536,2.4014275868733725
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,6144,8192,0.26713599099053276
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,6144,51200,1.8614400227864583
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,6144,10240,0.4146417776743571
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,6144,8192,0.3231733375125461
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,6144,6144,0.10615377955966526
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,6144,7168,0.24080265892876518
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,6144,5120,0.0894755588637458
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,6144,7168,0.283860445022583
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,6144,4096,0.07211377885606554
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,6144,6144,0.20128444830576578
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,6144,5120,0.16262043846978083
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,6144,6144,0.2445004516177707
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,6144,3584,0.058444446987575956
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,6144,5120,0.20955555968814424
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,6144,4096,0.13164356019761828
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,6144,3072,0.05020266771316528
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,6144,65536,2.480470233493381
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,6144,4096,0.16926133632659912
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,6144,2560,0.04249866803487142
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,6144,3584,0.1498319970236884
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,6144,3584,0.1171991162829929
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,6144,3072,0.1031528910001119
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,6144,3072,0.13225421640608045
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,6144,1536,0.026172444224357605
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,6144,2560,0.11524889204237197
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,6144,2560,0.09017155567804973
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,6144,51200,1.9170915815565321
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,6144,1024,0.0199608885579639
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,6144,2048,0.09787911176681519
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,6144,2048,0.07437777519226074
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,6144,768,0.016735111673672993
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,6144,1536,0.05892266829808553
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,6144,512,0.012513777448071374
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,6144,1536,0.08014577627182007
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,6144,1024,0.04418933391571045
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,6144,768,0.053915556934144765
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,6144,768,0.03660444418589274
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,6144,256,0.009936889012654623
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,6144,128,0.009012444151772393
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,6144,512,0.028540445698632136
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,6144,256,0.03575733304023743
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,6144,256,0.024409777588314478
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,6144,64,0.007653333246707916
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,6144,128,0.031178666485680476
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,6144,32,0.00794488853878445
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,6144,128,0.023079999619060095
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,6144,64,0.0229795558585061
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,6144,32,0.022655111220147874
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,6144,2048,0.03436444534195794
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,5120,65536,0.9425990846421984
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,5120,51200,0.7412186728583442
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,6144,512,0.04377333323160807
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,5120,16384,0.2607528898451063
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,5120,16384,0.49098931418524844
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,5120,12288,0.1868373288048638
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,5120,16384,0.6168079906039768
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,5120,65536,2.143493228488498
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,6144,1024,0.062149332629309766
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,5120,51200,1.6685946782430012
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,5120,12288,0.3772888978322347
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,5120,10240,0.16743644078572592
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,5120,8192,0.12955021858215332
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,5120,10240,0.3032906585269504
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,5120,12288,0.4530346658494737
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,5120,8192,0.26576354768541127
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,5120,7168,0.11623644828796387
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,5120,10240,0.37781066364712185
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,5120,6144,0.10219289196862115
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,5120,8192,0.304421345392863
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,5120,65536,2.2990470462375217
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,5120,5120,0.08576177888446385
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,5120,6144,0.18068267239464653
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,5120,7168,0.27146487765842015
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,5120,4096,0.06435110833909777
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,5120,51200,1.8041227128770616
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,5120,6144,0.22735465897454155
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,5120,5120,0.14962311585744223
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,5120,3584,0.05694933070076836
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,5120,5120,0.190811554590861
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,5120,3072,0.04808355702294243
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,5120,4096,0.12220356199476455
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,5120,2560,0.041646222273508705
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,5120,4096,0.15793244043986002
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,5120,3584,0.14090577761332193
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,5120,3584,0.1077573365635342
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,5120,3072,0.09451911184522842
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,5120,3072,0.12416356139712864
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,5120,1536,0.02680355476008521
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,5120,2560,0.10720266898473103
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,5120,2560,0.08075288931528728
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,5120,1024,0.020421332783169217
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,5120,2048,0.06766311327616374
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,5120,2048,0.09165866507424249
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,5120,1536,0.053344001372655235
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,5120,1536,0.0754035578833686
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,5120,512,0.012432888978057437
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,5120,1024,0.04019644525316026
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,5120,1024,0.058950225512186684
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,5120,768,0.033618665403789945
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,5120,256,0.009319110876984065
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,5120,512,0.026642666922675237
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,5120,256,0.03525155451562669
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,5120,256,0.02256711158487532
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,5120,128,0.007981333467695449
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,5120,64,0.007268444531493717
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,5120,7168,0.2141582171122233
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,5120,128,0.029979556798934937
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,5120,128,0.02130399975511763
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,5120,64,0.02125066684352027
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,5120,32,0.020915556285116408
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,5120,2048,0.03446844551298354
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,5120,768,0.016923555069499545
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,4096,65536,0.7265022065904406
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,5120,768,0.05055911011166043
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,5120,512,0.04122666517893473
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,4096,51200,0.5507733556959364
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,4096,16384,0.1833653317557441
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,5120,32,0.007278222176763747
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,4096,12288,0.13695289029015437
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,4096,16384,0.44808175828721786
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,4096,10240,0.11988622612423366
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,4096,12288,0.33791467878553605
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,4096,16384,0.5885270966423882
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,4096,12288,0.4490053388807509
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,4096,8192,0.09782933526568943
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,4096,65536,1.8745316399468317
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,4096,10240,0.28270310825771755
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,4096,7168,0.09013866715961033
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,4096,10240,0.3562355571322971
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,4096,8192,0.22594756550259062
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,4096,51200,1.4622347089979384
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,4096,6144,0.07383377684487237
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,4096,8192,0.28905510902404785
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,4096,7168,0.1951822174919976
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,4096,5120,0.060360888640085854
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,4096,7168,0.2480764389038086
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,4096,6144,0.16532177395290798
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,4096,6144,0.21256000465816924
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,4096,4096,0.04651111033227709
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,4096,3584,0.04098577631844415
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,4096,5120,0.1790613333384196
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,4096,4096,0.11023822095659043
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,4096,65536,2.147484461466471
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,4096,4096,0.1481635570526123
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,4096,3072,0.03462310963206821
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,4096,2560,0.030978666411505804
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,4096,3584,0.09827644295162624
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,4096,51200,1.6856169170803492
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,4096,3584,0.13179732693566218
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,4096,2048,0.024871110916137695
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,4096,3072,0.11670311292012532
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,4096,3072,0.08559022347132365
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,4096,1536,0.020388444264729817
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,4096,2560,0.10135022136900161
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,4096,2048,0.05942044655481974
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,4096,1024,0.014483556151390076
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,4096,2048,0.08570400211546157
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,4096,768,0.012496888637542725
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,4096,1536,0.048060443666246205
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,4096,1536,0.0710408886273702
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,4096,512,0.00960799968904919
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,4096,1024,0.035996443695492215
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,4096,768,0.04689244429270426
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,4096,768,0.030537777476840552
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,4096,256,0.007276444799370236
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,4096,512,0.04084088736110263
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,4096,512,0.02464444438616435
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,4096,128,0.0069155556460221606
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,4096,256,0.020582222276263766
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,4096,256,0.03291022115283542
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,4096,64,0.005933333188295364
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,4096,128,0.028100444210900202
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,4096,32,0.006223111102978389
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,4096,64,0.01953866746690538
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,4096,5120,0.13607733779483372
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,4096,32,0.01923377811908722
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,4096,2560,0.07227377759085761
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,3584,65536,0.6781146791246203
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,4096,1024,0.05562488900290596
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,3584,16384,0.16978932751549614
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,4096,128,0.01962844365172916
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,3584,16384,0.4241653283437093
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,3584,12288,0.13126933574676514
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,3584,16384,0.5532675319247776
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,3584,12288,0.31907910770840114
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,3584,10240,0.1174337731467353
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,3584,65536,1.7870311737060547
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,3584,51200,0.5140515433417426
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,3584,12288,0.4202977816263835
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,3584,51200,1.3884639739990234
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,3584,8192,0.09220000108083089
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,3584,7168,0.08205688661999173
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,3584,10240,0.2679591178894043
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,3584,8192,0.2142408953772651
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,3584,6144,0.06574044624964397
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,3584,8192,0.28377334276835126
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,3584,7168,0.18627733654446074
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,3584,5120,0.05879111422432793
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,3584,7168,0.2458266682094998
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,3584,6144,0.15646578205956355
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,3584,4096,0.04689244429270426
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,3584,6144,0.21176711718241373
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,3584,5120,0.12968888547685412
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,3584,65536,2.1394098069932723
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,3584,3584,0.03976266582806905
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,3584,5120,0.17778044276767305
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,3584,3072,0.033839109871122576
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,3584,4096,0.14679733912150064
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,3584,51200,1.6776150597466364
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,3584,2560,0.029456890291637842
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,3584,3584,0.09343110852771336
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,3584,3584,0.13133600023057726
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,3584,3072,0.11638043986426459
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,3584,3072,0.08102222283681233
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,3584,2048,0.02531911101606157
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,3584,1536,0.020113777783181932
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,3584,2560,0.10012088881598578
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,3584,2560,0.06857066684299044
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,3584,2048,0.05664622121387058
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,3584,1024,0.015368888775507608
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,3584,1536,0.04569244384765625
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,3584,768,0.01236355553070704
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,3584,1536,0.07003377543555366
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,3584,512,0.010268444816271463
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,3584,1024,0.05472266674041748
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,3584,1024,0.03429066803720262
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,3584,768,0.0473635560936398
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,3584,768,0.028925332758161757
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,3584,512,0.023592000206311543
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,3584,512,0.03803199860784743
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,3584,128,0.006621333460013072
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,3584,256,0.03222577770551046
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,3584,10240,0.3541902171240912
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,3584,64,0.005924444645643234
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,3584,128,0.018577777677112155
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,3584,128,0.02643199927277035
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,3584,32,0.005995555470387141
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,3584,64,0.018536888890796237
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,3584,32,0.018532445033391316
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,3584,4096,0.10513066583209568
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,3072,65536,0.5446026590135362
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,3584,2048,0.08525244394938152
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,3072,51200,0.4141857888963487
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,3584,256,0.007272000114123027
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,3072,16384,0.14098666773902044
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,3584,256,0.01979555520746443
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,3072,12288,0.10473155313067967
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,3072,16384,0.40463733673095703
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,3072,12288,0.30444267061021596
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,3072,16384,0.5384284655253092
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,3072,10240,0.09124444590674506
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,3072,65536,1.6733857260810003
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,3072,12288,0.39340710639953613
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,3072,8192,0.07842577828301324
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,3072,10240,0.26213955879211426
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,3072,51200,1.3522710800170898
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,3072,7168,0.061583108372158475
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,3072,10240,0.3307733270857069
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,3072,8192,0.20311200618743896
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,3072,8192,0.26552976502312553
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,3072,6144,0.056872891055213086
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,3072,7168,0.1764462259080675
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,3072,5120,0.04585777719815572
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,3072,7168,0.23144798808627656
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,3072,4096,0.03922222057978312
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,3072,51200,1.5636587142944336
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,3072,65536,1.9931066301133897
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,3072,6144,0.19795821772681343
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,3072,5120,0.12304977575937907
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,3072,3584,0.03148533238304986
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,3072,3072,0.02834933333926731
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,3072,5120,0.1670560042063395
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,3072,4096,0.137990223036872
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,3072,4096,0.10020977920956081
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,3072,3584,0.08879199955198501
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,3072,3584,0.12326221995883518
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,3072,3072,0.0770933363172743
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,3072,2048,0.019592000378502738
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,3072,3072,0.10905866490470038
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,3072,1536,0.0158942225906584
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,3072,2560,0.06709688901901245
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,3072,1024,0.011703111231327057
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,3072,2048,0.05426222085952759
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,3072,1536,0.04247644543647766
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,3072,1536,0.06588621934254964
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,3072,768,0.009701333112186855
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,3072,1024,0.0322364436255561
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,3072,1024,0.05068711108631558
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,3072,512,0.007886221839321984
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,3072,768,0.027471999327341717
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,3072,768,0.043143110142813794
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,3072,256,0.0064311110311084324
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,3072,512,0.0222746663623386
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,3072,512,0.0374035570356581
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,3072,128,0.005886222339338726
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,3072,256,0.01891288823551602
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,3072,256,0.031680001152886286
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,3072,64,0.0052488889131281115
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,3072,32,0.005371555685997009
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,3072,128,0.026047110557556152
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,3072,64,0.017551110850440133
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,3072,6144,0.14902044667137995
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,3072,32,0.01754488878779941
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,3072,2560,0.023242667317390442
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,2560,65536,0.46907822291056317
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,2560,51200,0.35687910185919863
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,3072,2560,0.09458577632904053
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,3072,2048,0.08071200052897136
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,2560,16384,0.12738666269514295
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,2560,12288,0.10005778074264526
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,2560,16384,0.3837440013885498
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,3072,128,0.017825777331988018
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,2560,12288,0.29504089885287815
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,2560,16384,0.515500439537896
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,2560,10240,0.08269511328803168
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,2560,8192,0.06519289149178399
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,2560,12288,0.39255555470784503
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,2560,10240,0.2437280019124349
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,2560,51200,1.2230382495456271
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,2560,65536,1.5511449178059895
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,2560,7168,0.05633422401216295
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,2560,10240,0.329257779651218
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,2560,8192,0.19248799482981363
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,2560,6144,0.04699733191066318
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,2560,5120,0.04163644380039639
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,2560,8192,0.2654995653364393
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,2560,7168,0.1674177779091729
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,2560,6144,0.1404622263378567
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,2560,7168,0.23007554478115508
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,2560,4096,0.033407111962636314
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,2560,6144,0.19654488563537598
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,2560,3584,0.029562665356530085
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,2560,5120,0.11657688352796768
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,2560,5120,0.16549244191911486
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,2560,4096,0.13758844799465603
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,2560,3072,0.02684533264901903
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,2560,51200,1.5628364351060655
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,2560,3584,0.12264711327022976
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,2560,3584,0.08449866374333699
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,2560,2560,0.02277333372169071
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,2560,2048,0.01921066641807556
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,2560,3072,0.10815733008914524
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,2560,3072,0.07380533218383789
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,2560,2560,0.09372622436947292
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,2560,2560,0.0619751082526313
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,2560,1536,0.015485333071814643
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,2560,1024,0.012086222569147745
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,2560,2048,0.08017422093285455
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,2560,1536,0.0640159977806939
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,2560,768,0.010729778144094678
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,2560,1024,0.030480888154771592
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,2560,1024,0.051121777958340116
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,2560,512,0.009015999734401703
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,2560,768,0.026047999660174053
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,2560,768,0.04284177886115181
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,2560,256,0.007461333440409766
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,2560,512,0.020962667134073045
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,2560,512,0.03685155510902405
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,2560,128,0.005375999957323074
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,2560,256,0.017859554953045316
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,2560,256,0.030663109487957422
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,2560,64,0.005221333354711533
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,2560,128,0.025412445267041523
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,2560,128,0.01681422193845113
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,2560,32,0.004927111168702443
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,2560,4096,0.09355733129713271
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,2560,64,0.016542222764756944
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,2560,65536,1.9883475833468969
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,2048,65536,0.34139643775092227
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,2560,2048,0.05123555660247803
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,2048,51200,0.3004008928934733
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,2560,1536,0.04012799925274319
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,2048,16384,0.09832355711195205
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,2048,16384,0.3594133324093289
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,2048,12288,0.06978222396638659
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,2048,16384,0.5010711352030436
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,2560,32,0.016494222813182406
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,2048,12288,0.27203554577297634
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,2048,65536,1.424021297030979
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,2048,10240,0.06196977694829305
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,2048,51200,1.1706452899509006
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,2048,8192,0.04803644286261665
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,2048,12288,0.3681635591718886
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,2048,10240,0.2280977831946479
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,2048,7168,0.04302488764127096
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,2048,10240,0.3067377673255073
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,2048,8192,0.1809919940100776
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,2048,8192,0.2470160060458713
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,2048,6144,0.0370435549153222
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,2048,7168,0.15706400076548258
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,2048,5120,0.030840890275107488
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,2048,51200,1.4472106297810872
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,2048,65536,1.8472461700439453
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,2048,4096,0.02552177839808994
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,2048,3584,0.02386222283045451
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,2048,6144,0.13267910480499268
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,2048,6144,0.18273777431911895
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,2048,5120,0.10935378074645996
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,2048,5120,0.15452799532148573
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,2048,4096,0.08910133441289265
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,2048,4096,0.12786666552225748
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,2048,2560,0.01737777723206414
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,2048,3584,0.07886933618121676
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,2048,3584,0.11446844206915961
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,2048,2048,0.014671999547216626
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,2048,3072,0.10180977980295818
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,2048,3072,0.06879999902513292
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,2048,2560,0.05819377634260389
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,2048,1536,0.012058667010731168
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,2048,2560,0.0881893303659227
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,2048,1024,0.009610666996902889
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,2048,2048,0.04732444551255968
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,2048,2048,0.07516800032721625
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,2048,768,0.008063111040327284
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,2048,1536,0.03792444533771939
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,2048,1536,0.06190311246448093
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,2048,512,0.006919999917348226
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,2048,1024,0.048262221945656665
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,2048,256,0.0053102220926019884
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,2048,768,0.02439822256565094
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,2048,768,0.040552000204722084
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,2048,128,0.004935111022657818
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,2048,512,0.03456799851523505
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,2048,512,0.019870221614837646
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,2048,64,0.004514666481150521
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,2048,256,0.029416001505321924
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,2048,256,0.016866667403115165
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,2048,32,0.004288889053795072
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,2048,128,0.025045333637131587
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,2048,128,0.016146666473812528
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,2048,64,0.0155395550860299
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,2048,32,0.015526221858130561
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,2048,7168,0.2147057718700833
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,1536,65536,0.30129954550001353
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,1536,51200,0.24214487605624727
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,2048,3072,0.020281778441535104
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,1536,16384,0.07649688588248359
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,1536,16384,0.33805423312717015
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,2048,1024,0.028598222467634413
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,1536,12288,0.056959999932183154
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,1536,16384,0.508404466840956
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,1536,10240,0.048384000857671104
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,1536,51200,1.035919083489312
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,1536,12288,0.25548889901902944
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,1536,8192,0.03577866819169786
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,1536,65536,1.3245955573187935
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,1536,12288,0.3631600009070502
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,1536,7168,0.033182223637898765
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,1536,10240,0.21676266193389893
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,1536,10240,0.3053075472513835
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,1536,8192,0.17078399658203125
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,1536,6144,0.028498666154013738
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,1536,8192,0.24551465776231554
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,1536,7168,0.14803911579979792
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,1536,5120,0.02424888809521993
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,1536,7168,0.21318311161465117
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,1536,4096,0.020060444871584576
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,1536,6144,0.12436089250776504
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,1536,51200,1.452999962700738
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,1536,6144,0.18175733089447021
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,1536,3584,0.017782222893502977
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,1536,5120,0.10213422112994724
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,1536,65536,1.833497789171007
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,1536,5120,0.15318577819400364
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,1536,3072,0.016174222032229107
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,1536,4096,0.08309155702590942
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,1536,2560,0.013735111388895245
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,1536,4096,0.12649956014421251
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,1536,3584,0.07397066884570651
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,1536,3584,0.11391822497049968
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,1536,2048,0.012149333126015134
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,1536,3072,0.1007502211464776
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,1536,1536,0.009729777773221334
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,1536,3072,0.06403911113739014
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,1536,2560,0.08760977453655666
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,1536,2560,0.05414666732152303
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,1536,1024,0.007954667011896769
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,1536,768,0.0069777775141927935
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,1536,2048,0.07413955529530843
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,1536,2048,0.044248888889948525
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,1536,1536,0.05929866764280531
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,1536,1536,0.03489777776930068
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,1536,512,0.005893333504597346
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,1536,1024,0.046887109676996865
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,1536,1024,0.027099554737408955
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,1536,768,0.022967111733224656
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,1536,768,0.04049333267741733
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,1536,512,0.033950222863091364
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,1536,128,0.004530666602982415
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,1536,512,0.01904355486234029
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,1536,64,0.0041946665280395085
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,1536,256,0.015840000576443143
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,1536,32,0.003955555458863576
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,1536,128,0.02502044373088413
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,1536,64,0.01481599940194024
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,1536,32,0.0144533332851198
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,1024,65536,0.21324533886379668
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,1024,51200,0.16989866892496744
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,1536,256,0.004893333133724001
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,1024,16384,0.05430044399367439
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,1536,256,0.028889778587553237
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,1024,51200,0.9616133371988932
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,1536,128,0.015132443772421943
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,1024,65536,1.2298000123765733
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,1024,12288,0.039001779423819646
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,1024,10240,0.033145778708987765
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,1024,16384,0.3153315650092231
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,1024,8192,0.025920889443821375
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,1024,12288,0.23916623327467176
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,1024,10240,0.20060622692108154
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,1024,16384,0.43953688939412433
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,1024,7168,0.02278222143650055
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,1024,12288,0.3351031144460042
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,1024,10240,0.28261155552334255
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,1024,51200,1.3287475374009874
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,1024,6144,0.020367999871571858
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,1024,8192,0.15935644838545057
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,1024,65536,1.6902373631795247
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,1024,8192,0.22673511505126953
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,1024,7168,0.13825955655839708
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,1024,4096,0.014469333820872836
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,1024,7168,0.1961644490559896
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,1024,6144,0.11561866601308186
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,1024,6144,0.16797778341505262
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,1024,3584,0.013095999757448832
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,1024,3072,0.011729777687125735
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,1024,5120,0.09500710831748115
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,1024,5120,0.14108267095353869
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,1024,2560,0.01038044442733129
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,1024,4096,0.11745511160956489
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,1024,3584,0.0687991115781996
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,1024,3584,0.10515466663572524
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,1024,2048,0.008895999855465358
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,1024,3072,0.09349955452813043
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,1024,2560,0.08111111323038737
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,1024,2560,0.0503840015994178
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,1024,1536,0.007705777883529663
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,1024,2048,0.0407626661989424
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,1024,2048,0.06933955351511638
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,1024,1024,0.006238222122192383
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,1024,1536,0.03244888782501221
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,1024,1536,0.055571556091308594
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,1024,768,0.005583999885453119
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,1024,1024,0.04366755485534668
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,1024,1024,0.025306666890780132
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,1024,512,0.004933333231343163
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,1024,768,0.021595555875036452
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,1024,768,0.03792000148031447
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,1024,256,0.004270222038030624
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,1024,512,0.017862222260899015
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,1024,512,0.03228444523281521
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,1024,128,0.0038737778862317405
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,1024,256,0.0151591118839052
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,1024,256,0.02742133372359806
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,1024,64,0.0038151111867692736
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,1024,5120,0.017432888348897297
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,1024,32,0.0038248888320393036
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,1024,128,0.014182221558358936
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,1024,64,0.013743110828929476
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,1024,32,0.013464888764752282
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,768,65536,0.17800711260901558
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,1024,4096,0.07726399766074286
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,768,51200,0.13935289118025038
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,1024,3072,0.059458666377597384
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,768,16384,0.04815466536415947
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,768,16384,0.30537867546081543
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,768,12288,0.03108711043993632
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,768,16384,0.43872621324327254
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,768,51200,0.955116483900282
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,768,65536,1.184495078192817
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,768,12288,0.23128178384568956
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,1024,128,0.024015110399987962
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,768,10240,0.024474667178259954
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,768,8192,0.024576000041431848
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,768,12288,0.3339262273576524
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,768,7168,0.01874755488501655
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,768,8192,0.15451733271280924
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,768,10240,0.19378222359551323
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,768,10240,0.2817653285132514
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,768,8192,0.22584001223246256
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,768,51200,1.321133295694987
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,768,7168,0.13339377774132624
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,768,5120,0.014135999812020196
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,768,7168,0.19538044929504395
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,768,65536,1.6846532821655273
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,768,6144,0.11168711715274388
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,768,4096,0.014075555735164218
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,768,6144,0.1676337718963623
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,768,5120,0.0914471083217197
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,768,3584,0.010681777364677854
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,768,5120,0.1408568885591295
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,768,3072,0.010683555569913654
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,768,4096,0.07450489203135173
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,768,4096,0.117686218685574
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,768,3584,0.06600355439715914
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,768,2560,0.008622222476535374
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,768,3584,0.10439733664194743
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,768,3072,0.09312355518341064
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,768,2048,0.007771555748250749
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,768,3072,0.057061334451039634
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,768,1536,0.006634666687912411
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,768,2560,0.04775911238458422
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,768,2560,0.07917600207858615
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,768,2048,0.03859466645452712
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,768,1024,0.005229333208666907
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,768,1536,0.03121688961982727
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,768,1536,0.05482044484880236
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,768,768,0.005045333256324132
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,768,512,0.004547555413511065
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,768,1024,0.04326755470699734
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,768,768,0.037428445286220975
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,768,768,0.02092444399992625
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,768,256,0.0038924444880750445
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,768,512,0.01722133325205909
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,768,128,0.003793777690993415
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,768,512,0.032129777802361384
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,768,256,0.014499555031458536
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,768,6144,0.01568266749382019
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,768,128,0.022290666898091633
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,768,128,0.013439999686347114
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,768,32,0.0035111109415690103
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,768,64,0.013231111069520315
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,512,65536,0.13608711295657688
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,512,51200,0.10154222117529975
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,768,2048,0.06874399714999728
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,768,1024,0.0243857784403695
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,512,16384,0.03236177894804213
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,768,256,0.026994667119450037
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,768,64,0.00350222239891688
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,512,51200,0.8938088946872287
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,512,65536,1.1421395407782662
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,512,16384,0.2941048940022786
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,512,10240,0.01860000027550591
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,768,32,0.013088888592190213
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,512,12288,0.22308622466193306
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,512,16384,0.4342924488915338
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,512,8192,0.015556444724400839
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,512,10240,0.1865253316031562
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,512,12288,0.33049511909484863
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,512,7168,0.01408088869518704
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,512,65536,1.6700098249647353
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,512,8192,0.14887466695573595
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,512,10240,0.2790195677015516
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,512,6144,0.012069332930776807
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,512,8192,0.22352798779805502
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,512,51200,1.3090107176038954
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,512,5120,0.01089777797460556
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,512,7168,0.19389777713351777
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,512,6144,0.1074062254693773
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,512,4096,0.00941955546538035
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,512,6144,0.16655377546946207
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,512,5120,0.08831822209888035
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,512,3584,0.008804444637563493
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,512,5120,0.13981600602467856
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,512,3072,0.007999111380841997
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,512,4096,0.0713004469871521
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,512,12288,0.0226275556617313
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,512,3584,0.10400622420840794
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,512,2560,0.007145778172545963
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,512,3072,0.0540888872411516
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,512,3072,0.09148799710803562
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,512,2560,0.08004799816343519
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,512,2048,0.0373671121067471
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,512,2048,0.06690044535530938
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,512,1536,0.03013333347108629
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,512,7168,0.12813956207699245
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,512,1024,0.004868444469239977
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,512,1536,0.05466577741834852
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,512,1024,0.04321777820587158
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,512,1024,0.0233262214395735
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,512,768,0.00452977791428566
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,512,4096,0.1162853373421563
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,512,768,0.037695109844207764
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,512,768,0.020249777370029025
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,512,512,0.0038559999730851916
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,512,3584,0.0636133352915446
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,512,256,0.0037973332736227247
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,512,512,0.031888888941870794
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,512,512,0.01681511104106903
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,512,128,0.0035048888789282907
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,512,256,0.027033777700530157
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,512,2560,0.045828445090187915
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,512,64,0.0032088889016045462
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,512,32,0.003168888803985384
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,512,128,0.023456000619464453
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,512,128,0.013069333301650153
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,512,1536,0.005869333528810077
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,256,65536,0.07504622141520183
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,512,32,0.012432888978057437
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,256,51200,0.05981155236562093
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,256,16384,0.02438755498992072
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,256,51200,0.8572213384840223
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,512,2048,0.00656355544924736
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,512,256,0.014097778333557976
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,256,65536,1.0959724850124783
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,512,64,0.012724444270133972
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,256,16384,0.2831804487440321
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,256,10240,0.016855110724767048
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,256,12288,0.21483377615610758
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,256,8192,0.01350488927629259
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,256,12288,0.32980799674987793
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,256,16384,0.4323848883310954
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,256,51200,1.3056489096747506
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,256,7168,0.012438221938080259
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,256,10240,0.18010577890608045
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,256,6144,0.011039999624093374
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,256,10240,0.2778284549713135
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,256,65536,1.6612088945176866
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,256,8192,0.14347733391655818
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,256,5120,0.009704888694816166
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,256,7168,0.12320710553063287
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,256,8192,0.22331288125779894
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,256,7168,0.19290844599405924
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,256,4096,0.00851022203763326
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,256,3584,0.00777599960565567
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,256,6144,0.10330044560962254
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,256,6144,0.1657093365987142
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,256,5120,0.08477155367533366
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,256,5120,0.13956711027357313
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,256,3072,0.007154666715198093
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,256,2560,0.006526222245560751
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,256,4096,0.11515111393398708
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,256,3584,0.06057066387600369
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,256,3584,0.10336089134216309
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,256,2048,0.005550222264395819
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,256,3072,0.05198755529191759
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,256,3072,0.09097333086861505
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,256,1536,0.004853333450025982
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,256,2560,0.07845866680145264
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,256,2560,0.04349955585267809
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,256,12288,0.01763288842307197
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,256,1024,0.00424177779091729
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,256,2048,0.06662933031717937
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,256,2048,0.03568266828854879
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,256,1536,0.02899644441074795
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,256,1024,0.02274311085542043
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,256,1024,0.04284177886115181
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,256,512,0.003549333247873518
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,256,768,0.019592000378502738
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,256,768,0.03663911090956794
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,256,256,0.0031724443866146933
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,256,512,0.03131466772821214
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,256,512,0.016214221715927124
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,256,128,0.0031519999934567344
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,256,256,0.027098667290475633
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,256,64,0.0030053332448005676
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,256,128,0.012758221891191272
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,256,32,0.0028773333049482773
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,256,64,0.012422222230169507
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,256,32,0.012176888684431711
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,128,65536,0.057711111174689404
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,256,4096,0.06880799929300944
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,128,51200,0.0461751123269399
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,256,768,0.0041777777175108595
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,256,1536,0.05411466625001696
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,128,16384,0.01346933344999949
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,256,256,0.013146667016877068
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,128,16384,0.2825128767225477
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,256,128,0.02177511155605316
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,128,12288,0.014700444208251106
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,128,65536,1.0938569174872506
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,128,51200,0.8569262292650012
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,128,10240,0.012653333445390066
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,128,12288,0.2147066725624932
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,128,8192,0.013047110703256396
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,128,16384,0.4311857753329807
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,128,12288,0.3283582263522678
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,128,10240,0.18013955487145317
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,128,7168,0.011709333293967776
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,128,10240,0.27693867683410645
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,128,6144,0.010375111467308467
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,128,8192,0.143230226304796
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,128,65536,1.654800838894314
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,128,8192,0.2231431007385254
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,128,7168,0.12317689259847005
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,128,51200,1.2993431091308594
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,128,7168,0.19269066386752656
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,128,4096,0.007660444411966536
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,128,6144,0.10303199953503078
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,128,6144,0.16524444686041936
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,128,3584,0.007263999846246507
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,128,5120,0.08416622214847141
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,128,5120,0.13943555619981554
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,128,4096,0.06816444132063124
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,128,3072,0.006574222197135289
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,128,4096,0.11499288347032334
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,128,2560,0.005881777654091517
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,128,3584,0.060303999318016895
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,128,3584,0.10346311330795288
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,128,2048,0.005261333452330695
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,128,3072,0.0513644450240665
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,128,3072,0.09107999669180976
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,128,1536,0.004583111239804162
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,128,2560,0.042528887589772545
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,128,2560,0.0788959993256463
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,128,1024,0.003911111089918348
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,128,2048,0.03526755505137973
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,128,2048,0.06543022394180298
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,128,768,0.0038986665507157645
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,128,1536,0.02882933285501268
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,128,1536,0.05410755674044291
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,128,1024,0.02233244478702545
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,128,512,0.003552888830502828
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,128,256,0.0032133333798911837
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,128,768,0.03646844294336107
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,128,768,0.019560888409614563
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,128,128,0.0028248888750871024
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,128,512,0.016162667009565566
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,128,512,0.03081511126624213
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,128,64,0.0028728888266616394
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,128,256,0.0131217779384719
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,128,256,0.026739555928442214
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,128,32,0.0029075555503368378
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,128,128,0.02127200033929613
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,128,64,0.012072888513406118
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,128,32,0.012050666742854647
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,128,5120,0.008989333278603023
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,64,51200,0.04407199886110094
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,64,16384,0.016766221986876596
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,64,12288,0.01315822203954061
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,64,10240,0.012107555237081317
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,64,16384,0.2826480070749919
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,64,10240,0.17934577994876436
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,64,8192,0.01073688848151101
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,64,7168,0.010414222048388587
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,64,8192,0.14302844471401638
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,64,7168,0.12242310576968723
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2304,128,1024,0.04248799880345663
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,64,51200,0.8557662434048123
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,64,5120,0.009473777479595607
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,64,4096,0.007937777373525832
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,64,65536,1.0945955912272136
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,64,6144,0.1028675569428338
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,64,3584,0.007585778004593319
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,64,5120,0.08387200037638347
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,128,128,0.012096888489193387
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,64,4096,0.06807377603318956
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,64,3072,0.006899555524190267
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,64,2560,0.006246222390068903
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,64,65536,0.05372800098525154
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,64,2048,0.005225777626037598
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,64,1536,0.004588444613748127
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,64,3584,0.05980000231001112
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,64,3072,0.0510480006535848
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,64,1024,0.004208000169859992
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,64,2560,0.04244800077544319
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,64,768,0.0035626664757728577
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,64,2048,0.03503377901183234
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,64,512,0.0035137778355015647
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,64,256,0.003154666680428717
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,64,1536,0.028757333755493164
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,64,128,0.002874666617976295
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,64,768,0.01924088928434584
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,64,512,0.015847999188635085
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,64,12288,0.21435288588205972
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,64,256,0.01295111080010732
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,64,32,0.00281866660548581
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,64,128,0.012104888757069906
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,32,65536,0.04892266790072123
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,64,64,0.012083555261294046
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,64,32,0.011716444459226398
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,32,51200,0.04121511181195577
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,32,16384,0.01038755559258991
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,32,12288,0.008980444735950893
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,64,6144,0.00942666663063897
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,32,10240,0.008407110969225565
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,32,16384,0.2826160060034858
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,32,12288,0.21456800566779244
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,32,8192,0.007791111038790808
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,32,7168,0.007324444750944774
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,32,10240,0.17910667260487875
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,32,6144,0.007606222397751278
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,32,8192,0.1423191097047594
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,32,7168,0.12271111541324192
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,32,5120,0.007263110743628607
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,32,4096,0.014807111687130399
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,32,51200,0.8550320201449924
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,32,6144,0.1020151111814711
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,32,3584,0.013792888985739814
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,64,1024,0.02234755622016059
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,32,3072,0.012088889049159156
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,32,5120,0.08375733428531223
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,32,65536,1.0920133590698242
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,64,64,0.002817777709828483
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,32,2560,0.01036088913679123
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,32,4096,0.06795199712117513
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,32,2048,0.0052622221410274506
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,32,3584,0.06002489063474867
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,32,1536,0.00452533322903845
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,32,1024,0.003891555385457145
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,32,768,0.0038648889296584656
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,32,3072,0.05102755626042684
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,32,512,0.0035084444615576
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,32,2560,0.04225066635343763
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,32,256,0.002934222213096089
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,32,2048,0.03487644592920939
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,32,1536,0.028780443800820246
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,32,128,0.002814222127199173
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,32,1024,0.022286223040686712
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,32,64,0.00281866660548581
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,32,768,0.01958666741847992
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2304,32,32,0.002833777831660377
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,32,512,0.015848888291252982
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,32,256,0.013087111214796701
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,32,64,0.011737777955002256
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,32,128,0.012078222301271228
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2304,32,32,0.011727111207114326
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,65536,10240,1.7153715557522242
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,65536,10240,1.8900693257649739
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,65536,12288,2.1207938724093967
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,65536,12288,2.254688051011827
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,65536,16384,2.681666692097982
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,65536,8192,1.3413884904649522
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,65536,16384,3.1447387271457248
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,65536,7168,1.1824507183498807
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,65536,8192,1.4150898191663954
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,65536,6144,1.0616871515909831
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,65536,7168,1.2380630705091689
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,65536,5120,0.8306524488661023
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,65536,4096,0.6458569102817112
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,65536,3584,0.563378651936849
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,65536,6144,1.0584061940511067
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,65536,5120,0.9074302249484592
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,65536,4096,0.7496159871419271
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,65536,3072,0.5461013582017686
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,65536,3584,0.639595561557346
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,65536,2560,0.4650142457750108
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,65536,3072,0.5652097596062554
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,65536,2560,0.4523990948994954
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,65536,2048,0.34548266728719074
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,65536,1536,0.2574088838365343
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,65536,1024,0.20092799928453234
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,65536,1024,0.2215893268585205
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,65536,1536,0.34811822573343915
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,65536,2048,0.41630310482449
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,65536,512,0.11052711142434014
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,65536,768,0.19829511642456055
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,65536,256,0.07955911424424914
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,65536,128,0.06521599822574191
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,65536,512,0.1610977782143487
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,65536,64,0.05575911204020182
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,65536,256,0.1400408877266778
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,65536,128,0.13007111019558376
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,65536,32,0.05626933442221748
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,65536,64,0.1305039988623725
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,65536,32,0.13127288553449842
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,65536,768,0.14680177635616726
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,65536,51200,8.571401807996962
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,51200,16384,2.0250462426079645
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,51200,12288,1.4872631496853297
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,51200,12288,1.8055288526746962
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,51200,16384,2.551234563191732
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,51200,10240,1.3572702407836914
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,51200,10240,1.4850951300726996
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,51200,8192,0.9744924969143338
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,51200,51200,6.361918131510417
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,65536,51200,12.689301384819878
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,51200,8192,1.1982222663031685
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,51200,7168,0.7792275746663412
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,51200,6144,0.8270782364739312
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,51200,6144,0.8781706492106119
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,51200,7168,1.0265092849731445
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,51200,5120,0.6053359773423936
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,51200,4096,0.5662150912814671
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,51200,3584,0.3926808834075928
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,51200,65536,8.142990960015192
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,51200,5120,0.740264892578125
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,51200,3072,0.3733875486585829
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,51200,4096,0.5655600229899088
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,51200,2560,0.3304968939887153
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,51200,3584,0.5491733551025391
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,51200,3072,0.4544569121466742
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,51200,2560,0.3665733337402344
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,51200,2048,0.24869243303934732
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,51200,1024,0.13370666238996717
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,51200,768,0.10486311382717556
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,51200,1536,0.24090933799743652
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,51200,2048,0.2963502142164442
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,51200,512,0.07999466525183783
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,51200,256,0.056679109732309975
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,51200,1024,0.1785093281004164
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,51200,768,0.1453582180870904
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,51200,1536,0.19231111473507354
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,51200,512,0.12337511115603977
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,51200,64,0.041617777612474226
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,51200,32,0.042057779100206166
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,51200,256,0.12090933322906494
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,51200,128,0.10316089126798843
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,51200,64,0.10681422551472981
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,51200,32,0.10375199715296428
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,51200,51200,9.961950514051649
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,16384,16384,0.6692346466912164
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,51200,128,0.04728177852100796
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,16384,12288,0.514286200205485
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,16384,12288,0.6818453470865885
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,16384,16384,0.9681875440809461
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,16384,10240,0.40064356062147355
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,16384,51200,2.13356802198622
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,16384,8192,0.29884976810879177
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,16384,7168,0.31300534142388237
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,16384,10240,0.5656631257798936
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,16384,65536,2.689057879977756
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,16384,8192,0.47104088465372723
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,16384,7168,0.39878132608201766
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,16384,6144,0.2750808927747938
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,16384,5120,0.22772532039218477
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,16384,6144,0.3305902216169569
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,16384,5120,0.2793697781032986
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,51200,65536,12.379513210720487
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,16384,4096,0.17040267255571154
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,16384,3072,0.12763999568091497
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,16384,4096,0.25701244672139484
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,16384,3584,0.19406399461958143
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,16384,2048,0.08044266700744629
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,16384,3072,0.18336089452107748
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,16384,2560,0.14614400598737928
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,16384,1536,0.06564978096220228
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,16384,1024,0.0461386673980289
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,16384,2048,0.12053778436448838
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,16384,768,0.03459111187193129
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,16384,51200,3.5325707329644094
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,16384,1536,0.10065688689549764
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,16384,1024,0.07488266626993816
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,16384,256,0.021363554729355708
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,16384,768,0.0607831080754598
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,16384,128,0.018220444520314533
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,16384,64,0.015776889191733468
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,16384,512,0.052391111850738525
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,16384,256,0.04468799961937798
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,16384,32,0.016392888294325936
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,16384,128,0.04076000054677328
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,16384,64,0.040660444233152605
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,16384,32,0.039164443810780845
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,16384,3584,0.15828711456722683
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,16384,65536,4.203252580430773
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,16384,2560,0.10865155855814616
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,16384,512,0.02843022346496582
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,12288,16384,0.48922310935126406
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,12288,12288,0.3703671031528049
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,12288,16384,0.7415511343214246
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,12288,51200,1.545347531636556
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,12288,10240,0.30192356639438206
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,12288,12288,0.649455123477512
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,12288,8192,0.26033955150180393
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,12288,65536,2.0628329383002386
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,12288,10240,0.45547109180026585
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,12288,7168,0.20972888999515107
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,12288,8192,0.38072623146904844
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,12288,5120,0.16160710652669272
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,12288,6144,0.2082151174545288
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,12288,7168,0.34806132316589355
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,12288,6144,0.26623378859625924
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,12288,4096,0.13134311305152044
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,12288,5120,0.23245954513549805
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,12288,3584,0.11059644487169053
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,12288,4096,0.20399022102355957
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,12288,3584,0.15883110629187688
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,12288,2560,0.08164799875683255
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,12288,2048,0.06942044364081489
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,12288,1536,0.050823999775780566
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,12288,3072,0.14055200417836508
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,12288,2560,0.12369333373175727
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,12288,1024,0.03444177905718485
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,12288,768,0.02716800073782603
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,12288,2048,0.09970221916834514
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,12288,1536,0.08343999915652806
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,12288,256,0.01796533332930671
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,12288,1024,0.06083466609319051
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,12288,768,0.04983199967278374
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,12288,128,0.014134221606784396
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,12288,512,0.04012088974316915
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,12288,64,0.01203733351495531
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,12288,51200,2.7751235961914062
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,12288,32,0.01239999963177575
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,12288,256,0.035409778356552124
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,12288,128,0.032412442896101214
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,12288,64,0.03216977914174398
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,12288,32,0.03492533498340183
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,12288,65536,3.5976443820529513
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,12288,3072,0.09591644340091282
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,10240,16384,0.38134222560458714
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,10240,12288,0.3056311077541775
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,12288,512,0.02149155570401086
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,10240,16384,0.6796639760335287
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,10240,10240,0.2418888939751519
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,10240,51200,1.258273760477702
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,10240,12288,0.5006595717536079
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,10240,8192,0.20100533962249756
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,10240,7168,0.19647022088368735
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,10240,10240,0.4036666552225749
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,10240,65536,1.6240115695529516
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,10240,6144,0.1496444410747952
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,10240,5120,0.11920000447167291
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,10240,8192,0.34173067410786945
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,10240,4096,0.10178844134012859
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,10240,3584,0.08669955862892999
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,10240,6144,0.3001493348015679
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,10240,3072,0.07867999871571858
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,10240,4096,0.15961066881815592
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,10240,5120,0.2432337866889106
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,10240,3584,0.15264177322387695
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,10240,2560,0.06330577532450359
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,10240,2048,0.05429955654674106
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,10240,1536,0.038768000072903104
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,10240,1024,0.027963555521435205
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,10240,3072,0.13833688365088567
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,10240,2560,0.10806400246090359
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,10240,768,0.024484443995687697
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,10240,1536,0.07454755571153429
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,10240,512,0.019474666979577806
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,10240,256,0.015305777390797934
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,10240,768,0.04504444532924228
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,10240,512,0.03597955571280585
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,10240,128,0.012038222617573209
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,10240,51200,2.277589374118381
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,10240,256,0.03026755650838216
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,10240,32,0.010423999693658618
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,10240,128,0.029161777761247423
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,10240,64,0.029184887806574505
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,10240,32,0.028788444068696763
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,10240,7168,0.28017600377400714
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,10240,65536,3.0207396613227
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,8192,16384,0.33475645383199054
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,10240,2048,0.0943982203801473
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,10240,1024,0.055071999629338585
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,8192,12288,0.24632000923156738
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,10240,64,0.01034400032626258
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,8192,51200,1.0383439593844943
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,8192,65536,1.310896873474121
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,8192,10240,0.20516355832417807
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,8192,8192,0.19022044870588514
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,8192,16384,0.6166675355699327
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,8192,12288,0.42266045676337344
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,8192,7168,0.14659289518992105
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,8192,10240,0.3525422149234348
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,8192,6144,0.1322151157591078
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,8192,5120,0.10515289174185859
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,8192,8192,0.30068445205688477
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,8192,7168,0.29296800825330943
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,8192,6144,0.2251208888159858
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,8192,4096,0.07674044370651245
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,8192,5120,0.17699021763271758
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,8192,3072,0.06028622388839722
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,8192,4096,0.14510044786665174
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,8192,2560,0.0506897767384847
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,8192,3584,0.13383732901679143
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,8192,2048,0.04391466577847799
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,8192,3072,0.11285421583387588
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,8192,1536,0.03369955552948846
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,8192,51200,1.9864603678385417
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,8192,1024,0.025175111161337957
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,8192,768,0.019096000327004325
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,8192,2048,0.079839997821384
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,8192,1536,0.06365066766738892
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,8192,512,0.01536711057027181
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,8192,256,0.011752000285519494
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,8192,1024,0.04920444554752774
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,8192,768,0.039585779110590615
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,8192,512,0.03185688787036472
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,8192,64,0.008740444150235917
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,8192,65536,2.570416980319553
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,8192,128,0.025757332642873127
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,8192,32,0.01033155537313885
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,8192,64,0.02557777696185642
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,8192,32,0.025322667426533167
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,8192,3584,0.07703644699520536
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,8192,2560,0.09606666697396173
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,7168,51200,0.802592913309733
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,7168,16384,0.29246756765577525
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,8192,128,0.010610666539933948
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,7168,65536,1.1683786180284288
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,8192,256,0.02677511175473531
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,7168,12288,0.2202062209447225
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,7168,10240,0.200708442264133
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,7168,8192,0.1533422205183241
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,7168,12288,0.39332087834676105
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,7168,10240,0.3301653332180447
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,7168,7168,0.13531466325124106
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,7168,16384,0.5556666586134169
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,7168,6144,0.1125333309173584
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,7168,8192,0.30155732896592885
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,7168,5120,0.09028977817959255
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,7168,7168,0.2255857785542806
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,7168,4096,0.08137422137790255
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,7168,3584,0.06315466430452135
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,7168,6144,0.22564533021714953
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,7168,5120,0.1604426701863607
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,7168,3072,0.0543066660563151
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,7168,4096,0.13396533330281576
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,7168,2560,0.04682755470275879
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,7168,2048,0.0359866652223799
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,7168,3584,0.11909600098927815
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,7168,51200,1.8363094329833984
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,7168,1536,0.030629333522584703
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,7168,3072,0.11963555547926162
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,7168,1024,0.022476444641749065
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,7168,2560,0.0887591110335456
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,7168,2048,0.07311199771033393
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,7168,65536,2.323855929904514
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,7168,512,0.014476444986131458
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,7168,1536,0.059727112452189125
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,7168,256,0.011188444164064197
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,7168,1024,0.0433884428607093
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,7168,64,0.008967111508051554
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,7168,32,0.009337777892748514
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,7168,512,0.02882755464977688
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,7168,256,0.024863110648261175
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,7168,128,0.02411288850837284
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,7168,64,0.023741333021057978
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,7168,32,0.025036444266637165
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,6144,16384,0.25270578596327037
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,6144,51200,0.7429137759738498
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,6144,65536,1.018423080444336
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,7168,768,0.018381334013409086
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,6144,12288,0.19693599806891549
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,6144,16384,0.5279742346869575
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,7168,128,0.009359111388524374
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,6144,10240,0.1657608879937066
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,7168,768,0.037420445018344455
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,6144,7168,0.11513955063290066
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,6144,8192,0.2396248976389567
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,6144,6144,0.09990488820605808
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,6144,10240,0.3454924424489339
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,6144,7168,0.2080319987403022
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,6144,5120,0.078274667263031
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,6144,4096,0.06617599725723267
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,6144,51200,1.6240719689263239
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,6144,3584,0.05809599823421902
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,6144,6144,0.1758613321516249
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,6144,5120,0.15252710713280573
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,6144,3072,0.04830844534767998
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,6144,4096,0.12452710999382867
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,6144,2560,0.0421324438518948
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,6144,2048,0.03506933318244086
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,6144,3584,0.11028355360031128
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,6144,3072,0.09354933102925618
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,6144,2560,0.08176977766884698
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,6144,65536,2.079719967312283
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,6144,1024,0.021282666259341772
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,6144,2048,0.06967466407352023
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,6144,768,0.015826667348543804
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,6144,512,0.012246222131782107
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,6144,1536,0.054062220785352916
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,6144,256,0.009716444545321995
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,6144,1024,0.040716442796919085
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,6144,128,0.008612444831265343
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,6144,768,0.03530844383769565
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,6144,512,0.0270471109284295
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,6144,64,0.007657777931955125
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,6144,8192,0.13229066795772976
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,6144,32,0.007828444242477417
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,6144,256,0.023079999619060095
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,6144,128,0.02235377828280131
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,6144,64,0.022042666872342426
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,6144,32,0.021980444590250652
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,6144,12288,0.4229111141628689
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,5120,16384,0.21420621871948242
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,5120,12288,0.15965688228607178
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,5120,16384,0.4468204180399577
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,5120,51200,0.6335413191053603
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,6144,1536,0.027691556347741023
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,5120,65536,0.8693715731302897
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,5120,10240,0.13186932934655085
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,5120,8192,0.10423644383748372
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,5120,7168,0.08949333429336548
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,5120,12288,0.3358177873823378
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,5120,6144,0.08190311325920953
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,5120,10240,0.29407911830478245
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,5120,8192,0.23387556605868867
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,5120,5120,0.0684444440735711
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,5120,7168,0.18978133466508654
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,5120,4096,0.05138577686415779
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,5120,3584,0.04534133275349935
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,5120,3072,0.03836266530884637
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,5120,5120,0.13704089323679605
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,5120,4096,0.11817333433363174
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,5120,2560,0.03285955720477634
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,5120,3584,0.10030666987101237
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,5120,2048,0.02868088748719957
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,5120,51200,1.4930506812201605
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,5120,1536,0.02163644466135237
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,5120,3072,0.08500978019502427
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,5120,1024,0.016528889536857605
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,5120,2560,0.07490222321616279
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,5120,768,0.013120888835854001
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,5120,2048,0.06157244576348198
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,5120,512,0.010275555153687796
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,5120,256,0.008332444561852349
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,5120,1536,0.048716445763905845
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,5120,1024,0.0370417767100864
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,5120,128,0.007297777467303806
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,5120,65536,1.9268417358398438
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,5120,768,0.032257778777016535
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,5120,64,0.006615110983451207
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,5120,512,0.025241777300834656
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,5120,256,0.021352888809310064
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,5120,128,0.020616888999938965
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,5120,64,0.02068444424205356
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,5120,32,0.020298666424221463
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,4096,16384,0.16319555706448025
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,4096,51200,0.43073511123657227
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,5120,6144,0.16101866298251682
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,4096,65536,0.596235540178087
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,4096,12288,0.12730844815572104
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,4096,10240,0.11536710792117649
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,4096,16384,0.4044106536441379
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,4096,8192,0.08995199865765041
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,4096,12288,0.3030880027347141
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,4096,7168,0.07781155241860284
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,4096,6144,0.06648177570766874
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,4096,10240,0.2611244519551595
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,4096,8192,0.20066132810380724
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,4096,5120,0.05445422066582573
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,4096,7168,0.1904062165154351
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,4096,4096,0.04418666826354133
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,4096,3584,0.039451556073294744
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,4096,6144,0.14716000027126735
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,4096,3072,0.03380089004834493
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,4096,5120,0.12544443872239855
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,4096,4096,0.10072533289591472
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,4096,2560,0.02914488977856106
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,4096,3584,0.08939733107884724
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,4096,51200,1.326067606608073
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,4096,2048,0.025096888343493145
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,4096,1536,0.019596444235907663
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,4096,3072,0.07800088988410102
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,4096,2560,0.06692177719540067
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,4096,2048,0.054551111327277295
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,4096,1536,0.04489244355095757
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,4096,65536,1.6858338250054254
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,4096,256,0.0073902226156658595
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,4096,768,0.028901331954532202
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,4096,128,0.006577777779764599
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,4096,512,0.02308799988693661
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,4096,256,0.01980444457795885
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,4096,64,0.005897777775923411
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,4096,128,0.018927110566033255
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,4096,32,0.005884444548024072
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,4096,64,0.01887022289964888
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,4096,32,0.01835911141501533
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,5120,32,0.0069120000633928515
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,4096,1024,0.015494222442309061
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,3584,65536,0.5410986476474339
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,4096,768,0.012014221813943652
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,3584,51200,0.4333626694149441
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,4096,1024,0.033356444703208074
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,3584,16384,0.15960800647735596
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,3584,12288,0.11207111676534016
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,3584,10240,0.09498400158352321
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,3584,8192,0.0767315559917026
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,3584,16384,0.38310933113098145
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,3584,12288,0.2895422246721056
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,3584,7168,0.06525778108172946
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,3584,10240,0.2644346555074056
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,3584,6144,0.057357331116994224
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,3584,5120,0.04734933376312256
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,3584,8192,0.21421066919962564
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,3584,7168,0.16518755753835043
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,3584,4096,0.039495110511779785
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,3584,6144,0.14485332700941297
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,3584,3584,0.03688888748486837
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,3584,3072,0.03198666705025567
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,3584,4096,0.09558666414684719
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,3584,2560,0.026290666725900438
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,3584,3584,0.08761066860622829
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,3584,65536,1.5946177376641169
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,3584,2048,0.022823111878501043
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,3584,3072,0.07613688707351685
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,3584,51200,1.2462284300062392
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,3584,2560,0.06452266375223796
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,3584,1024,0.01424088908566369
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,4096,512,0.009348444640636444
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,3584,768,0.011415999796655444
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,3584,2048,0.053358223703172475
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,3584,512,0.00964355551534229
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,3584,1536,0.04398311177889506
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,3584,256,0.00868711123863856
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,3584,1024,0.031720889939202204
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,3584,128,0.006215999937719769
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,3584,64,0.005577777822812398
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,3584,256,0.01905333333545261
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,3584,32,0.0059004442559348206
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,3584,128,0.018206222189797294
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,3584,64,0.017843556072976854
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,3584,32,0.01756266587310367
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,3072,65536,0.4845031102498372
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,3584,5120,0.11766221788194443
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,3072,51200,0.38831289609273273
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,3072,16384,0.13172622521718344
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,3584,1536,0.018446221947669983
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,3072,12288,0.09622844722535874
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,3072,10240,0.09240000115500556
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,3072,16384,0.4155413309733073
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,3584,768,0.027952889601389568
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,3072,12288,0.2750017907884386
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,3072,8192,0.07276088661617704
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,3072,7168,0.062352001667022705
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,3072,10240,0.22836621602376303
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,3072,6144,0.0520648890071445
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,3072,5120,0.04571111003557841
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,3072,8192,0.17997333738538954
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,3072,4096,0.03534844517707825
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,3072,7168,0.161244445376926
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,3072,3584,0.03128177920977274
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,3072,65536,1.4937004513210719
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,3072,3072,0.027676444914605882
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,3072,5120,0.11089599794811672
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,3072,2560,0.02404533326625824
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,3072,4096,0.09041777584287856
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,3072,2048,0.020377778344684176
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,3072,3584,0.08425866895251805
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,3072,51200,1.222087966071235
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,3072,1536,0.016321778297424316
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,3072,3072,0.07117155525419447
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,3072,1024,0.012764444781674279
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,3072,768,0.010432889064153036
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,3072,2048,0.0499511096212599
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,3072,1536,0.04004977809058295
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,3072,1024,0.02991822361946106
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,3072,256,0.006239999913507038
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,3072,768,0.02604622145493825
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,3072,128,0.005629333357016246
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,3072,64,0.005038222091065513
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,3072,512,0.021309332715140447
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,3072,32,0.005388444496525659
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,3072,256,0.018204443984561496
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,3072,128,0.017495999733606975
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,3072,64,0.016887111796273124
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,3584,512,0.02251111136542426
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,3072,32,0.017027555240525138
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,2560,16384,0.10817511214150323
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,2560,65536,0.42576445473565
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,2560,12288,0.0897759993871053
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,2560,16384,0.3433573246002197
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,3072,2560,0.06014133161968655
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,3072,512,0.008421333299742805
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,2560,10240,0.08124177985721164
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,2560,12288,0.2585955460866292
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,2560,8192,0.06656533479690552
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,2560,7168,0.05737777551015218
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,2560,51200,1.0901102489895291
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,2560,10240,0.21630311012268066
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,2560,8192,0.17029333114624023
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,2560,6144,0.04963111215167575
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,2560,65536,1.3981333838568792
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,2560,5120,0.040834665298461914
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,2560,7168,0.14744177129533556
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,2560,4096,0.03323555654949612
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,2560,6144,0.1248942216237386
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,2560,3584,0.02853511108292474
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,2560,3072,0.02474755545457204
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,2560,51200,0.3404408825768365
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,2560,2560,0.021716444028748408
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,2560,4096,0.08601333035363092
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,2560,2048,0.018205333087179396
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,2560,3584,0.07631199889712863
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,2560,3072,0.06640711095598009
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,2560,1536,0.014819555812411837
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,3072,6144,0.13419466548495823
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,2560,1024,0.011399110986126794
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,2560,768,0.009357333183288574
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,2560,2560,0.05674844317966037
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,2560,512,0.007300444775157505
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,2560,1536,0.037237332926856145
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,2560,256,0.005952000204059813
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,2560,1024,0.02846933404604594
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,2560,128,0.00554933316177792
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,2560,768,0.02453244394726223
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,2560,64,0.0052044445441828836
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,2560,512,0.019955555597941082
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,2560,32,0.005264889034960005
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,2560,256,0.017217778497272067
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,2560,128,0.016506666938463848
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,2560,64,0.016181333197487723
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,2560,32,0.01585422290696038
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,2048,16384,0.09942844178941514
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,2048,51200,0.264519108666314
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,2048,65536,0.3283262252807617
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,2048,12288,0.06854489114549425
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,2048,10240,0.057427558634016246
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,2048,16384,0.3278222348954943
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,2048,12288,0.2589342329237196
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,2560,5120,0.10458133618036906
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,2048,8192,0.046909332275390625
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,2048,7168,0.03860355416933695
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,2048,10240,0.21336000495486787
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,2048,6144,0.0328693323665195
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,2048,5120,0.02756888833310869
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,2048,4096,0.02290133304066128
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,2048,8192,0.1660648849275377
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,2560,2048,0.04676533407635159
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,2048,7168,0.14047022660573324
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,2048,3584,0.021244444780879553
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,2048,6144,0.12287022007836236
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,2048,3072,0.01864622202184465
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,2048,51200,1.018254174126519
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,2048,2560,0.01669066647688548
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,2048,5120,0.09998489088482326
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,2048,4096,0.08153777652316622
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,2048,3584,0.07292266686757405
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,2048,3072,0.06383111079533894
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,2048,1024,0.009319110876984065
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,2048,2560,0.05373511049482557
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,2048,65536,1.3021066453721788
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,2048,768,0.007983999947706858
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,2048,2048,0.044813334941864014
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,2048,512,0.006722666737106111
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,2048,256,0.005227555417352253
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,2048,1536,0.03562488820817735
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,2048,128,0.004634666774008009
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,2048,1024,0.027449778384632532
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,2048,64,0.004313777718279096
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,2048,768,0.0236462222205268
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,2048,32,0.004257777912749184
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,2048,256,0.015956444872750174
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,2048,128,0.015455999308162265
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,2048,64,0.015483554866578845
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,2048,32,0.01513066722287072
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,1536,16384,0.07328710953394572
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,1536,65536,0.26991645495096844
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,1536,51200,0.22458132108052573
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,1536,12288,0.05519377854135302
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,1536,10240,0.04614399870236715
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,1536,16384,0.3070053259531657
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,1536,12288,0.23195823033650717
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,1536,8192,0.03585066729121738
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,1536,10240,0.19691377215915254
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,1536,7168,0.03226577904489305
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,1536,6144,0.026816000541051228
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,2048,1536,0.011415111521879831
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,1536,8192,0.15222222275204128
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,1536,5120,0.023372444841596816
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,1536,7168,0.13242488437228733
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,1536,4096,0.020113777783181932
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,1536,6144,0.11153511206309001
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,1536,3584,0.017996443642510306
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,1536,5120,0.09309155411190456
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,2048,512,0.01924533314175076
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,1536,4096,0.07624710930718316
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,1536,65536,1.2033519744873047
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,1536,2560,0.014096000128322177
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,1536,3584,0.06813955307006836
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,1536,2048,0.012044444680213928
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,1536,1536,0.010046222143703038
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,1536,3072,0.058816889921824135
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,1536,2560,0.0499893327554067
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,1536,1024,0.008294222255547842
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,1536,768,0.007000889215204451
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,1536,2048,0.041329777903027005
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,1536,1536,0.032794667614830866
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,1536,512,0.006255110932721033
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,1536,1024,0.02546666728125678
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,1536,256,0.004923555586073133
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,1536,768,0.02216266592343648
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,1536,128,0.004876444323195351
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,1536,64,0.004522666749027041
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,1536,512,0.018058665924602084
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,1536,256,0.015461333923869662
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,1536,32,0.004851555658711327
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,1536,128,0.0148026661740409
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,1536,64,0.01443733274936676
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,1536,32,0.014333332578341166
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,2048,2048,0.014039999908871122
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,1024,65536,0.19682755735185412
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,1024,16384,0.05094044407208761
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,1024,51200,0.14998222721947566
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,1024,12288,0.04051733348104689
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,1024,10240,0.031097776359981958
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,1536,51200,0.9417102601793078
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,1024,8192,0.024315555890401203
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,1536,3072,0.01607733302646213
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,1024,12288,0.21624978383382162
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,1024,7168,0.021419554948806763
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,1024,10240,0.18053244219885933
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,1024,6144,0.018900444110234577
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,1024,8192,0.1418222188949585
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,1024,7168,0.12264266279008652
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,1024,4096,0.014588443769348992
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,1024,5120,0.08632177776760525
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,1024,51200,0.8692648675706652
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,1024,3584,0.012873777912722694
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,1024,3072,0.011410666836632622
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,1024,4096,0.07033244768778484
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,1024,65536,1.106487062242296
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,1024,2560,0.010341333018408881
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,1024,2048,0.008671110702885522
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,1024,3584,0.062427553865644664
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,1024,3072,0.053789334164725415
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,1024,1536,0.007657777931955125
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,1024,2560,0.0454675555229187
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,1024,2048,0.037540445725123085
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,1024,768,0.005564444594913059
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,1024,1536,0.03049955434269375
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,1024,512,0.004907555464241239
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,1024,1024,0.023753777146339417
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,1024,256,0.004214222232500712
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,1024,768,0.020637333393096924
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,1024,128,0.0041982221106688184
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,1024,512,0.01720711092154185
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,1024,16384,0.286368899875217
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,1024,64,0.0038951109680864546
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,1024,32,0.004176889028814104
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,1024,128,0.013753777576817406
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,1024,5120,0.017052445146772597
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,1024,64,0.013737777868906656
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,1024,32,0.013451555536852943
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,768,65536,0.15462666087680393
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,768,51200,0.12455999851226807
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,1024,6144,0.10374044709735447
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,768,16384,0.039677331844965615
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,768,12288,0.030343112018373277
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,768,10240,0.0247013337082333
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,768,16384,0.27601777182685006
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,768,12288,0.20905600653754342
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,768,10240,0.17380800512101915
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,1024,1024,0.006520888871616787
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,768,7168,0.018574222922325134
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,768,6144,0.01612977849112617
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,768,5120,0.014397333065668741
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,768,8192,0.13676267200046116
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,768,4096,0.012152888708644442
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,768,7168,0.11832622687021892
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,768,6144,0.09891555706659953
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,768,3584,0.011373333632946014
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,768,51200,0.8359120157029895
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,768,5120,0.08276977803972033
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,768,3072,0.010048000348938836
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,768,2560,0.008956444760163626
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,1024,256,0.014470222923490735
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,768,2048,0.00794222205877304
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,768,4096,0.0675848921140035
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,768,1536,0.0069644442862934535
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,768,1024,0.005896889087226655
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,768,2560,0.04317422376738655
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,768,2048,0.03530222177505493
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,768,1536,0.029513776302337646
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,768,768,0.004905777672926585
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,768,1024,0.022984888818528917
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,768,768,0.020263999700546265
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,768,256,0.0038542221817705366
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,768,512,0.01663644446267022
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,768,128,0.004187555362780889
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,768,256,0.014138667119873894
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,768,64,0.0038417776425679526
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,768,8192,0.020609777834680345
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,768,128,0.013406222065289816
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,768,32,0.0038924444880750445
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,768,64,0.013087111214796701
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,768,32,0.012842666771676807
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,512,65536,0.11841421657138401
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,512,51200,0.08993689219156902
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,512,16384,0.03944622145758735
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,768,65536,1.0652071634928386
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,768,3584,0.05953511264589098
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,768,3072,0.05176000131501091
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,512,12288,0.02757511039574941
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,512,10240,0.023331556055280898
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,512,8192,0.01940533353222741
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,768,512,0.004204444587230682
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,512,16384,0.2653413348727756
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,512,12288,0.2006231149037679
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,512,7168,0.017633777525689866
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,512,10240,0.16787555482652453
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,512,6144,0.015814221567577787
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,512,5120,0.013364444176355997
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,512,8192,0.13121867179870605
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,512,4096,0.011755555868148804
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,512,3584,0.010616888602574667
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,512,51200,0.8030088742574056
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,512,7168,0.11358933978610569
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,512,6144,0.09511288669374253
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,512,3072,0.009348444640636444
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,512,5120,0.07932088772455852
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,512,2560,0.008647110727098253
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,512,65536,1.0248115327623155
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,512,4096,0.06478666596942477
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,512,2048,0.007266666326257918
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,512,3584,0.057463109493255615
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,512,1024,0.0052435555391841466
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,512,3072,0.048864000373416476
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,512,1536,0.006257777826653586
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,512,768,0.004875555634498596
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,512,2560,0.042118221521377563
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,512,512,0.004184000194072723
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,512,2048,0.03398844599723816
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,512,256,0.003565333369705412
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,512,1536,0.028099556763966877
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,512,128,0.003690666622585721
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,512,1024,0.022293332550260756
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,512,768,0.01960444450378418
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,512,64,0.0032088889016045462
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,512,512,0.016158221496476066
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,512,32,0.00351200004418691
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,512,256,0.013743110828929476
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,512,128,0.01276177747382058
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,256,65536,0.07688089211781819
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,256,51200,0.062296887238820396
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,512,64,0.012786666552225748
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,512,32,0.01238044434123569
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,256,16384,0.023054222265879314
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,256,12288,0.018598222070270114
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,256,10240,0.01594577729701996
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,256,8192,0.013371555341614617
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,256,7168,0.012264889147546558
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,256,12288,0.19259999858008492
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,256,16384,0.25413865513271755
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,256,8192,0.12613244851430258
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,256,6144,0.010729778144094678
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,256,7168,0.10792444149653117
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,256,5120,0.009655111365848118
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,256,4096,0.00829777783817715
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,256,3584,0.007537778053018782
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,256,5120,0.07604177792867024
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,256,6144,0.09092977974149917
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,256,4096,0.06253600120544434
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,256,3072,0.006969778074158563
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,256,2560,0.006217777729034424
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,256,3584,0.05444000164667765
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,256,2048,0.005610666755172942
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,256,1536,0.004865777575307422
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,256,3072,0.045904888047112354
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,256,2560,0.03996444410747952
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,256,65536,0.9794178009033203
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,256,1024,0.004228444563017951
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,256,2048,0.03220444586541917
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,256,768,0.003846222327815162
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,256,512,0.003551111039188173
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,256,1536,0.027122666438420612
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,256,256,0.0034968890249729156
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,256,1024,0.02164177762137519
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,256,128,0.003216888962520493
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,256,768,0.018868444694413077
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,256,512,0.01568888955646091
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,256,64,0.0029013332807355454
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,256,32,0.002961777771512667
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,256,256,0.013111111190583972
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,256,128,0.01242844429281023
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,256,64,0.012060444388124677
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,128,65536,0.05228888988494873
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,256,32,0.011773332953453064
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,128,16384,0.016511110795868766
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,128,51200,0.042451557185914784
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,128,12288,0.013809777796268463
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,128,10240,0.01239111108912362
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,256,10240,0.16070489088694254
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,128,8192,0.011407111254003314
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,128,12288,0.19223911232418486
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,128,16384,0.25375554296705455
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,128,10240,0.1603964434729682
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,128,7168,0.0107004443804423
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,128,6144,0.01038044442733129
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,128,5120,0.009349333743254343
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,128,8192,0.12513244152069092
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,256,51200,0.7679120169745551
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,128,7168,0.10825422075059678
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,128,6144,0.09020266930262248
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,128,3584,0.007664889097213745
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,128,51200,0.7659031020270454
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,128,3072,0.006974221931563483
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,128,5120,0.0755573312441508
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,128,2560,0.00628977765639623
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,128,4096,0.061127112971411816
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,128,3584,0.05371733175383674
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,128,65536,0.9776177936130099
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,128,3072,0.045956446064843066
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,128,1536,0.004899555610285865
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,128,2560,0.03944977786805894
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,128,1024,0.0041804446114434134
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,128,2048,0.03239555491341485
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,128,512,0.003556444413132138
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,128,1536,0.027012444204754297
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,128,1024,0.021356445219781663
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,128,256,0.00315022220214208
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,128,768,0.01862044466866387
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,128,128,0.003156444471743372
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,128,64,0.002789333255754577
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,128,512,0.015480000111791821
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,128,32,0.0028657778683635923
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,128,256,0.01316177762216992
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,128,128,0.012103999654452005
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,64,65536,0.050804442829555936
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,128,32,0.011728888584507836
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,64,51200,0.03899466660287645
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,64,16384,0.013109332985348172
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,128,4096,0.007992888490358988
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,64,12288,0.014071111877759298
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,64,16384,0.2535208861033122
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,64,10240,0.012438221938080259
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,128,2048,0.005264889034960005
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,64,8192,0.011063999599880643
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,64,12288,0.1915724409951104
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,128,768,0.003899555653333664
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,64,7168,0.01035377797153261
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,64,51200,0.7668364312913684
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,64,6144,0.009682666924264696
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,64,8192,0.12543733914693198
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,64,65536,0.976835568745931
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,64,5120,0.008996444443861643
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,64,4096,0.00794577764140235
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,64,7168,0.10761333174175686
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,64,3584,0.007311999797821045
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,64,6144,0.08994933631685044
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,64,3072,0.006611555400821898
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,64,2560,0.005902222047249476
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,64,5120,0.0751697752210829
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,128,64,0.011966221862369113
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,64,2048,0.0052586665583981415
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,64,1536,0.004869333157936732
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,64,3072,0.04651644494798449
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,64,2560,0.03909511036343045
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,64,1024,0.0038888889054457345
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,64,2048,0.032235556178622775
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,64,768,0.003839111162556542
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,64,512,0.003216000066863166
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,64,1536,0.027081777652104694
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,64,256,0.0031715554909573663
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,64,1024,0.021261332763565913
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,64,128,0.0028231110837724474
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,64,512,0.015471110741297403
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,64,64,0.0028195555011431375
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,64,256,0.012746666868527731
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,64,32,0.0028124445428450904
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,64,128,0.012057777908113269
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,32,65536,0.04805688725577461
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,64,64,0.011767110890812345
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,32,51200,0.03970488905906677
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,64,32,0.011748444702890186
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,32,16384,0.011039111349317761
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,32,12288,0.009389333426952362
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,64,10240,0.16015911102294922
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,32,10240,0.009069333473841349
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,32,16384,0.25365689065721303
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,32,12288,0.19223999977111816
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,32,8192,0.00794666674402025
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,32,10240,0.1601004468070136
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,32,7168,0.007626666790909237
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,64,3584,0.053640001349978976
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,32,6144,0.007603555917739868
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,32,8192,0.12499199973212348
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,32,5120,0.010683555569913654
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,32,51200,0.7662631140814887
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,32,7168,0.10786577728059556
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,32,4096,0.00943288869327969
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,32,6144,0.08984533283445571
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,32,65536,0.9765564600626627
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,64,768,0.018533334136009216
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,32,3072,0.00795022232664956
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,32,5120,0.07541066408157349
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,32,2560,0.0069679998689227635
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,32,4096,0.06069778071509468
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,32,2048,0.0052488889131281115
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,32,3584,0.05370133452945285
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,32,1536,0.004523555437723796
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,32,1024,0.0038897775941424896
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,32,2560,0.03810311026043362
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,32,2048,0.03226577904489305
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,32,768,0.003670222229427762
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,32,1536,0.02684266699684991
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,32,512,0.0031519999934567344
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,32,1024,0.02126311096880171
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,32,256,0.0028817777832349143
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,32,128,0.002817777709828483
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,32,768,0.01871555546919505
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,32,64,0.002516444358560774
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,32,256,0.012749333348539142
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,32,32,0.0028239999794297745
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,32,128,0.01216533366176817
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,32,64,0.012091555529170565
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,64,4096,0.06093155675464206
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,32,32,0.011690666278203329
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2049,32,3584,0.008631111019187504
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,32,3072,0.04551377892494202
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2049,32,512,0.015464888678656684
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,65536,16384,2.471077389187283
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,65536,12288,1.8544267018636067
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,65536,16384,3.0656204223632812
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,65536,10240,1.5518710878160265
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,65536,12288,2.195102267795139
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,65536,16384,2.7515377468532987
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,65536,10240,1.7852906121148004
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,65536,12288,2.0498008728027344
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,65536,8192,1.3278907140096028
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,65536,8192,1.4470418294270833
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,65536,7168,1.103519121805827
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,65536,51200,7.764228820800781
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,65536,10240,1.7505244149102106
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,65536,7168,1.2337680392795138
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,65536,8192,1.3330657747056749
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,65536,6144,0.9266693327162
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,65536,5120,0.7390684551662869
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,65536,7168,1.1509404712253146
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,65536,5120,0.864033752017551
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,65536,6144,1.0282861921522353
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,65536,4096,0.6360498004489475
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,65536,6144,0.96142578125
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,65536,3584,0.47650935914781356
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,65536,5120,0.8011813163757324
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,65536,4096,0.7202915615505643
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,65536,3584,0.6217973497178819
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,65536,3072,0.4482044643825955
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,65536,4096,0.6481591330634223
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,65536,2560,0.34529778692457413
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,65536,3072,0.5888960096571181
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,65536,3584,0.5817306836446127
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,65536,3072,0.5000693533155653
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,65536,2048,0.3030311001671685
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,65536,2048,0.3747262159983317
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,65536,1536,0.21703467104170057
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,65536,2560,0.42828623453776044
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,65536,1536,0.3078462282816569
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,65536,1024,0.15324000517527261
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,65536,2048,0.3680115540822347
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,65536,1024,0.21969866752624512
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,65536,768,0.13024532794952393
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,65536,1536,0.28079644838968915
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,65536,768,0.18586488564809164
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,65536,1024,0.2196791172027588
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,65536,512,0.09641866551505195
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,65536,256,0.06707821951972114
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,65536,768,0.17830399672190347
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,65536,128,0.05755199988683065
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,65536,512,0.15181867281595865
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,65536,51200,12.014086405436197
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,65536,256,0.13407022423214382
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,65536,64,0.05565155877007378
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,65536,2560,0.4699440002441406
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,65536,256,0.11465599801805283
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,65536,128,0.09195999966727363
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,65536,32,0.05766399701436361
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,65536,128,0.12446755833095974
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,65536,64,0.12626755237579346
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,65536,32,0.12572177251180014
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,65536,512,0.15056533283657497
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,65536,51200,9.026513841417101
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,51200,16384,1.9270888434516058
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,51200,51200,6.058320787217881
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,51200,16384,2.463368945651584
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,51200,12288,1.519770622253418
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,51200,65536,7.748902214898004
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,51200,16384,2.212554719712999
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,51200,10240,1.3421270582411025
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,51200,12288,1.7457769181993272
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,51200,51200,9.774151272243923
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,51200,10240,1.4371350606282551
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,51200,8192,0.9463279512193469
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,51200,12288,1.5702462726169164
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,51200,8192,1.1600862079196506
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,51200,7168,0.8538986841837565
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,51200,10240,1.3186239666408963
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,51200,51200,7.196941799587673
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,51200,7168,0.9987084070841471
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,51200,6144,0.6617742114596897
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,51200,8192,1.090727064344618
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,51200,5120,0.6144426663716634
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,51200,65536,12.71677992078993
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,51200,7168,0.9365315967135959
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,51200,6144,0.8628995683458117
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,51200,5120,0.7262541982862684
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,51200,4096,0.5653555658128526
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,51200,3584,0.43190754784478086
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,51200,5120,0.6566364500257704
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,51200,4096,0.580844455295139
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,51200,3584,0.48901775148179794
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,51200,3072,0.38976889186435276
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,51200,4096,0.5335449112786187
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,51200,2560,0.27406756083170575
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,51200,3072,0.4409804344177246
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,51200,2048,0.2232417795393202
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,51200,3584,0.47769779629177517
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,51200,3072,0.41164178318447536
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,51200,2560,0.4102328883277045
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,51200,2048,0.2973866727617052
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,51200,1536,0.1873404449886746
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,51200,2560,0.3466977808210585
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,51200,1536,0.23444000879923502
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,51200,1024,0.13007822301652697
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,51200,1024,0.18224888377719453
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,51200,1536,0.23816090159946016
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,51200,2048,0.29457778400844997
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,51200,65536,9.23501247829861
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,51200,6144,0.7716711362202963
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,51200,1024,0.17584178182813856
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,51200,256,0.053900443845325045
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,51200,768,0.1408702267540826
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,51200,768,0.1520435545179579
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,51200,128,0.0459191103776296
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,51200,256,0.09641244676378037
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,51200,256,0.10590222146775986
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,51200,512,0.12157866689893936
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,51200,64,0.03866666555404663
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,51200,128,0.10060622294743855
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,51200,32,0.040911999013688825
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,51200,128,0.07698666387134127
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,51200,64,0.1011048886511061
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,51200,32,0.10144622458351983
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,51200,768,0.10813155439164902
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,51200,512,0.08127199941211276
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,51200,512,0.1418373319837782
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,16384,16384,0.5841653082105849
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,16384,16384,0.8989786571926541
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,16384,51200,2.2092107137044272
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,16384,65536,2.635849846733941
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,16384,12288,0.4625066651238336
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,16384,16384,0.879751099480523
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,16384,10240,0.3586346573299832
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,16384,12288,0.6949715614318848
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,16384,51200,3.1940799289279513
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,16384,8192,0.30867910385131836
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,16384,10240,0.567887994978163
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,16384,12288,0.6812284257676867
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,16384,7168,0.2429422272576226
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,16384,8192,0.43341154522365993
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,16384,10240,0.5734151204427084
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,16384,6144,0.2066782183117337
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,16384,65536,4.275110032823351
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,16384,5120,0.18352799945407441
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,16384,6144,0.3224488894144694
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,16384,5120,0.2929306560092502
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,16384,51200,2.9201217227511935
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,16384,4096,0.14389599694146052
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,16384,4096,0.2412044472164578
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,16384,7168,0.3777928882175022
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,16384,4096,0.2400897873772515
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,16384,8192,0.46133867899576825
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,16384,65536,3.71018558078342
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,16384,3584,0.12284799416859944
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,16384,3072,0.12736799981858996
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,16384,2560,0.099708444542355
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,16384,7168,0.3958408832550049
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,16384,3584,0.1895608901977539
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,16384,3072,0.18940267297956678
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,16384,2048,0.07264533307817247
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,16384,2560,0.14363555113474527
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,16384,6144,0.3490320046742757
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,16384,2560,0.15918044249216715
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,16384,1536,0.0631493330001831
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,16384,2048,0.11943111154768203
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,16384,5120,0.2862684461805555
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,16384,1024,0.043987555636299976
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,16384,1536,0.09526489178339641
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,16384,1536,0.11016711261537339
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,16384,768,0.03329599897066752
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,16384,1024,0.08580622408125137
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,16384,512,0.025778666138648987
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,16384,768,0.07344266441133288
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,16384,768,0.05982310904396904
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,16384,256,0.019672888848516677
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,16384,512,0.06128799915313721
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,16384,512,0.049626668294270836
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,16384,128,0.018343999981880188
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,16384,256,0.042769776450263135
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,16384,256,0.04901511139339871
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,16384,64,0.01566133399804433
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,16384,3584,0.21499733130137125
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,16384,128,0.040115555127461754
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,16384,128,0.041054222318861223
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,16384,3072,0.17529333962334526
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,16384,32,0.015834665960735746
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,16384,64,0.04007733199331496
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,16384,32,0.03824355536037021
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,16384,2048,0.13453155093722874
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,16384,1024,0.07301777601242065
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,12288,16384,0.4898559782240126
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,12288,51200,1.5551591449313695
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,12288,65536,1.969771491156684
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,12288,12288,0.38056267632378477
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,12288,16384,0.756133344438341
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,12288,12288,0.5552062458462185
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,12288,10240,0.31283643510606557
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,12288,16384,0.7686515384250217
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,12288,51200,2.740754657321506
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,12288,8192,0.27019643783569336
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,12288,12288,0.5882364379035102
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,12288,10240,0.4507137934366862
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,12288,7168,0.23308444023132324
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,12288,8192,0.38003910912407773
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,12288,65536,3.3766187032063804
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,12288,10240,0.5116328663296169
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,12288,6144,0.17993511093987358
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,12288,7168,0.30621422661675346
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,12288,8192,0.4194586541917589
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,12288,6144,0.26940711339314777
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,12288,5120,0.14177955521477595
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,12288,51200,2.4416311052110458
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,12288,7168,0.34225066502888996
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,12288,5120,0.21869333585103354
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,12288,4096,0.14076356093088785
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,12288,6144,0.3025804360707601
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,12288,3584,0.1152684423658583
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,12288,4096,0.18029510974884033
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,12288,5120,0.2550746599833171
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,12288,3072,0.10204178094863892
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,12288,4096,0.21301866902245414
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,12288,3584,0.18244622813330758
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,12288,3584,0.15852533446417913
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,12288,3072,0.13791822062598333
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,12288,2560,0.11892533302307129
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,12288,2048,0.06390488810009427
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,12288,1536,0.049048887358771436
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,12288,2560,0.14389867252773708
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,12288,65536,3.128756417168511
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,12288,2048,0.09918755292892456
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,12288,2048,0.11797600322299534
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,12288,1536,0.07920889059702556
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,12288,768,0.030052443345387776
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,12288,1536,0.09747111135058933
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,12288,512,0.02241155505180359
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,12288,1024,0.07510311073727079
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,12288,1024,0.06298133399751452
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,12288,768,0.06519555383258395
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,12288,768,0.04879022306866116
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,12288,256,0.01760088900725047
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,12288,512,0.054470221201578774
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,12288,512,0.03943999939494663
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,12288,128,0.014436443646748861
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,12288,64,0.013376889129479727
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,12288,256,0.033538666036393903
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,12288,32,0.012919999659061432
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,12288,128,0.03677422139379714
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,12288,128,0.03241066800223456
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,12288,64,0.031888888941870794
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,12288,32,0.031081779135598078
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,12288,2560,0.08349333206812541
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,12288,3072,0.1619608932071262
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,12288,1024,0.03569333420859443
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,10240,16384,0.38759467336866593
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,12288,256,0.04428889022933113
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,10240,51200,1.291203604804145
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,10240,65536,1.6514373355441625
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,10240,12288,0.32678400145636666
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,10240,16384,0.6881137953864204
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,10240,10240,0.2661653359731038
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,10240,16384,0.6943528917100695
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,10240,12288,0.5250230895148383
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,10240,12288,0.5392275386386448
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,10240,10240,0.42279911041259766
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,10240,51200,2.3651485443115234
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,10240,8192,0.22173333168029785
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,10240,10240,0.44768354627821183
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,10240,8192,0.32360267639160156
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,10240,7168,0.18983999888102213
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,10240,8192,0.3649315569135878
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,10240,7168,0.2722853289710151
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,10240,6144,0.17664178212483725
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,10240,5120,0.14497600661383733
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,10240,51200,2.192628436618381
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,10240,7168,0.31143376562330455
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,10240,6144,0.2377413378821479
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,10240,6144,0.26631198989020455
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,10240,4096,0.10988799730936687
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,10240,5120,0.234369781282213
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,10240,3584,0.09338933229446411
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,10240,4096,0.15830666489071316
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,10240,5120,0.23118310504489473
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,10240,65536,2.7922070821126304
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,10240,4096,0.18663999769422743
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,10240,3072,0.08352000183529323
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,10240,65536,2.8675653669569225
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,10240,3584,0.1717911163965861
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,10240,2048,0.0565591123369005
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,10240,3072,0.1497653325398763
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,10240,2560,0.12721333238813612
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,10240,1536,0.04351022177272373
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,10240,2048,0.08922400077184041
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,10240,2048,0.11026310920715332
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,10240,1024,0.02938577863905165
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,10240,1536,0.09008355273140801
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,10240,1536,0.07049689027998182
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,10240,1024,0.05296711126963297
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,10240,768,0.021964444054497614
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,10240,1024,0.0693733361032274
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,10240,512,0.01759111053413815
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,10240,768,0.06052977508968777
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,10240,768,0.04332355658213297
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,10240,256,0.013778666655222574
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,10240,512,0.035860445764329694
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,10240,256,0.02966488732231988
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,10240,128,0.011882666912343768
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,10240,256,0.041519999504089355
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,10240,3584,0.14551022317674425
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,10240,64,0.010330666270520952
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,10240,3072,0.12605244583553737
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,10240,128,0.033188445700539485
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,10240,128,0.02858577834235297
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,10240,2560,0.10634489191903009
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,10240,32,0.010355555348926121
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,10240,64,0.028363555669784546
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,10240,32,0.027868443065219458
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,10240,512,0.050424890385733716
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,8192,51200,1.0171261893378365
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,8192,65536,1.2788195080227323
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,8192,16384,0.33296177122328013
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,8192,12288,0.23526488410101998
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,8192,16384,0.5988186730278863
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,8192,12288,0.42469334602355957
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,8192,51200,1.9392488267686632
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,8192,16384,0.635500431060791
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,8192,10240,0.23109510209825304
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,10240,2560,0.06971200307210286
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,8192,12288,0.4763786527845595
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,8192,65536,2.550702200995551
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,8192,8192,0.16767644882202148
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,8192,10240,0.36209776666429305
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,8192,7168,0.15441244178348118
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,8192,8192,0.27447467380099827
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,8192,10240,0.3983742131127252
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,8192,6144,0.12815199957953557
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,8192,7168,0.25507378578186035
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,8192,8192,0.31575822830200195
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,8192,7168,0.28015467855665416
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,8192,6144,0.20213511255052355
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,8192,4096,0.08835199806425308
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,8192,6144,0.24255198902553984
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,8192,5120,0.17550222078959146
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,8192,3584,0.07851199971304999
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,8192,5120,0.20225066608852812
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,8192,4096,0.13684622446695963
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,8192,65536,2.4925848642985025
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,8192,3072,0.0668577750523885
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,8192,4096,0.16861155298021105
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,8192,3584,0.12473955419328477
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,8192,2560,0.056353780958387584
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,8192,3584,0.15128089321984187
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,8192,2048,0.042641778786977134
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,8192,3072,0.13505600558386907
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,8192,2560,0.09413244326909383
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,8192,2560,0.11573066976335313
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,8192,1536,0.03568711214595371
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,8192,2048,0.07812711265352038
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,8192,2048,0.09746044211917454
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,8192,1024,0.024907555845048692
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,8192,768,0.019874667127927143
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,8192,1536,0.08106488651699491
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,8192,1536,0.06232533189985487
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,8192,1024,0.045888000064426
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,8192,768,0.039008001486460366
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,8192,768,0.05552622344758776
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,8192,512,0.015338665909237333
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,8192,256,0.012098666694429187
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,8192,5120,0.10796266794204712
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,8192,512,0.030749334229363337
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,8192,512,0.04607999987072415
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,8192,128,0.010001777774757808
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,8192,256,0.026025777061780293
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,8192,64,0.009698666632175446
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,8192,256,0.03674666749106513
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,8192,32,0.010012444522645738
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,8192,128,0.03091555502679613
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,8192,64,0.025024000141355727
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,8192,32,0.024734222226672705
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,8192,3072,0.1085653305053711
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,8192,1024,0.06274133258395724
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,8192,51200,1.914703157212999
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,7168,65536,1.172933366563585
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,8192,128,0.025216889050271776
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,7168,51200,0.9479893578423394
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,7168,16384,0.3207937876383464
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,7168,16384,0.5177422099643284
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,7168,12288,0.24793778525458443
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,7168,16384,0.6261502371893989
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,7168,12288,0.38645066155327695
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,7168,65536,2.3386221991644964
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,7168,10240,0.21336444218953451
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,7168,51200,1.796261257595486
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,7168,12288,0.48035113016764325
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,7168,8192,0.17146755589379203
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,7168,10240,0.3226071198781331
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,7168,7168,0.14846932888031006
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,7168,8192,0.2612328794267443
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,7168,6144,0.1242106623119778
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,7168,8192,0.31524266137017143
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,7168,5120,0.10553866624832153
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,7168,6144,0.19217422273423937
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,7168,7168,0.27469778060913086
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,7168,65536,2.4250320858425565
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,7168,4096,0.08094666401545207
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,7168,6144,0.2741191122266981
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,7168,51200,1.8891137440999348
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,7168,5120,0.15717511706882054
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,7168,3584,0.06976977984110515
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,7168,5120,0.20035289393530953
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,7168,3072,0.06004710992177328
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,7168,4096,0.12794400586022273
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,7168,4096,0.16477155685424805
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,7168,2560,0.04674222071965536
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,7168,3584,0.11382577154371475
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,7168,3072,0.10138489140404595
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,7168,3072,0.1327928834491306
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,7168,2048,0.03724266754256354
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,7168,2560,0.08797066741519505
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,7168,1536,0.02870222263866001
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,7168,2560,0.11369155512915717
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,7168,1024,0.021538666552967493
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,7168,2048,0.09754488865534465
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,7168,2048,0.07228177785873413
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,7168,1536,0.07955644528071086
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,7168,1536,0.057387557294633657
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,7168,768,0.01824977828396691
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,7168,512,0.014549333188268872
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,7168,10240,0.40164889229668516
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,7168,1024,0.06267822451061673
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,7168,7168,0.2217173311445448
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,7168,768,0.054804444313049316
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,7168,768,0.03644888930850559
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,7168,128,0.009296000003814697
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,7168,512,0.028564443190892536
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,7168,512,0.043819556633631386
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,7168,64,0.008552889029184977
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,7168,256,0.02473066747188568
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,7168,32,0.009013333254390294
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,7168,128,0.02990666694111294
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,7168,128,0.023636443747414485
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,7168,64,0.023359111613697473
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,7168,32,0.022994667291641235
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,7168,3584,0.14766132831573486
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,6144,51200,0.7045964664883084
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,7168,1024,0.042949332131279834
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,6144,65536,0.9577431148952908
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,7168,256,0.01092711091041565
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,7168,256,0.03563288847605387
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,6144,16384,0.25121066305372447
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,6144,12288,0.18995466497209337
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,6144,16384,0.5160471068488227
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,6144,12288,0.3599502245585124
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,6144,10240,0.15683910581800672
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,6144,16384,0.5824284553527832
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,6144,8192,0.13538132773505315
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,6144,12288,0.44072710143195254
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,6144,10240,0.30442312028672963
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,6144,51200,1.6338764826456706
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,6144,65536,2.0789688958062067
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,6144,7168,0.10929689142439102
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,6144,10240,0.3731164402431912
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,6144,8192,0.23600978321499297
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,6144,6144,0.09300622012880112
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,6144,7168,0.21570577886369494
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,6144,8192,0.295105775197347
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,6144,7168,0.2611502276526557
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,6144,5120,0.08107378085454305
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,6144,6144,0.17335200309753418
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,6144,4096,0.06867200136184692
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,6144,6144,0.22349243693881563
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,6144,3584,0.05922044648064507
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,6144,5120,0.1890711122088962
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,6144,4096,0.11817688412136501
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,6144,4096,0.15758666727277967
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,6144,3072,0.050287110937966235
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,6144,3584,0.10499555534786648
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,6144,65536,2.2619974348280167
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,6144,3584,0.14003911283281115
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,6144,2560,0.04072711202833388
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,6144,3072,0.0923431118329366
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,6144,2048,0.03305955396758185
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,6144,3072,0.1229555606842041
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,6144,1536,0.026740445031060114
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,6144,51200,1.7754453023274739
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,6144,2560,0.08033866352505155
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,6144,2560,0.1074133316675822
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,6144,1024,0.01959733333852556
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,6144,2048,0.091103110048506
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,6144,2048,0.06679022312164307
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,6144,768,0.016604445046848722
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,6144,1536,0.05287733342912462
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,6144,1536,0.0754879977968004
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,6144,1024,0.03990666733847724
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,6144,1024,0.05869155459933811
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,6144,512,0.012164444559150271
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,6144,256,0.01204177737236023
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,6144,768,0.05156266689300537
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,6144,128,0.010515555739402771
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,6144,512,0.04172799984614054
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,6144,512,0.02695466743575202
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,6144,256,0.03495644529660543
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,6144,128,0.02928000026279026
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,6144,128,0.021949332621362474
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,6144,32,0.01034311122364468
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,6144,64,0.02198133369286855
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,6144,5120,0.1447226603825887
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,6144,32,0.021596444977654353
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,5120,65536,0.785979535844591
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,5120,51200,0.6837600072224935
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,6144,768,0.033957332372665405
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,6144,64,0.010011555420027839
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,5120,16384,0.21955022546980116
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,5120,16384,0.4367617766062419
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,5120,12288,0.17753511004977754
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,5120,16384,0.5455306900872124
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,5120,65536,1.8838123745388453
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,5120,10240,0.1363119946585761
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,5120,12288,0.328745788998074
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,6144,256,0.023032888770103455
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,5120,51200,1.4506648381551106
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,5120,8192,0.11042844586902195
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,5120,12288,0.4156951109568278
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,5120,7168,0.09472799963421291
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,5120,10240,0.28989511066012913
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,5120,6144,0.07792888747321235
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,5120,8192,0.216376887427436
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,5120,10240,0.3492640124426947
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,5120,8192,0.27784355481465656
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,5120,65536,2.119490729437934
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,5120,7168,0.1879884401957194
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,5120,5120,0.06912177801132202
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,5120,7168,0.2473306655883789
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,5120,4096,0.05320622192488777
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,5120,6144,0.16215466128455266
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,5120,6144,0.209206223487854
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,5120,3584,0.04816710948944092
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,5120,51200,1.6686106787787542
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,5120,3072,0.04217155443297493
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,5120,4096,0.10924088954925537
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,5120,5120,0.13362488481733534
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,5120,5120,0.1768408881293403
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,5120,4096,0.1470657719506158
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,5120,2560,0.032905777295430504
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,5120,3584,0.09905778037177192
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,5120,2048,0.02801333202256097
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,5120,3584,0.13227111763424343
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,5120,1536,0.02124799953566657
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,5120,3072,0.1160622172885471
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,5120,2560,0.10078310966491699
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,5120,2560,0.07174755467308892
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,5120,1024,0.016175111134847004
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,5120,2048,0.08635999759038289
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,5120,2048,0.060998221238454185
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,5120,768,0.01294222225745519
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,5120,1536,0.07171110974417792
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,5120,1536,0.04944444364971585
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,5120,512,0.010051555931568146
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,5120,1024,0.056030220455593534
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,5120,1024,0.03694933321740892
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,5120,768,0.04945688777499729
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,5120,768,0.030976000759336684
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,5120,128,0.007264888948864407
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,5120,512,0.03943555553754171
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,5120,512,0.02474311159716712
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,5120,64,0.006628444625271692
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,5120,256,0.03279733326699998
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,5120,256,0.021290666527218286
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,5120,32,0.006600889066855113
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,5120,128,0.028119110398822363
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,5120,128,0.02025422288311852
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,5120,64,0.020224000016848247
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,5120,32,0.01995644470055898
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,4096,51200,0.46256446838378906
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,5120,3072,0.084897776444753
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,5120,256,0.007993777592976889
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,4096,16384,0.39855466948615176
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,4096,51200,1.2981413735283744
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,4096,12288,0.13131999969482422
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,4096,65536,1.662546687655979
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,4096,65536,0.6120977931552464
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,4096,10240,0.11720444096459283
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,4096,12288,0.29918310377332896
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,4096,16384,0.5099777645534939
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,4096,12288,0.38878666030036074
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,4096,8192,0.09033333592944676
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,4096,10240,0.2505413426293267
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,4096,65536,1.9690009223090277
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,4096,10240,0.3263431125217014
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,4096,7168,0.08306222491794162
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,4096,51200,1.546296861436632
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,4096,8192,0.19762399461534289
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,4096,6144,0.07189777824613783
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,4096,8192,0.25847021738688153
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,4096,5120,0.060702224572499595
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,4096,7168,0.17042756080627441
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,4096,7168,0.22728888193766275
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,4096,4096,0.043803556097878345
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,4096,6144,0.1451831128862169
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,4096,6144,0.19585688908894858
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,4096,5120,0.12213155958387588
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,4096,3584,0.037909332248899676
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,4096,5120,0.1652631097369724
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,4096,3072,0.03363200028737386
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,4096,4096,0.09940799739625718
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,4096,4096,0.1373280021879408
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,4096,3584,0.08794666661156549
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,4096,3584,0.12271555264790852
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,4096,2560,0.02960977620548672
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,4096,2048,0.02511377798186408
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,4096,3072,0.07872533135943942
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,4096,3072,0.10874311129252116
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,4096,1536,0.0203813330994712
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,4096,2560,0.06413422028223674
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,4096,2560,0.09453777472178142
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,4096,2048,0.05381155676311917
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,4096,1024,0.014576888746685453
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,4096,2048,0.08021955357657538
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,4096,768,0.011925333076053195
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,4096,1536,0.043953776359558105
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,4096,16384,0.17600533697340223
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,4096,512,0.009320889082219865
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,4096,1024,0.050865779320398964
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,4096,1024,0.03299644589424133
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,4096,256,0.007297777467303806
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,4096,768,0.04567022124926249
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,4096,768,0.028464890188641016
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,4096,512,0.03769866625467936
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,4096,128,0.006814222368929122
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,4096,512,0.022660444180170696
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,4096,64,0.007262222468852997
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,4096,32,0.007621333003044128
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,4096,256,0.03220977716975742
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,4096,256,0.019949333535300363
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,4096,128,0.026850667264726426
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,4096,128,0.018547554810841877
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,4096,64,0.018545778261290658
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,4096,32,0.01819644371668498
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,3584,16384,0.15285778045654297
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,3584,51200,0.4755439758300781
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,3584,65536,0.6214346885681152
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,3584,12288,0.12581066290537515
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,3584,16384,0.37967999776204425
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,4096,1536,0.06730933321846856
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,3584,10240,0.11421422163645427
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,3584,12288,0.31339910295274526
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,3584,16384,0.5260533226860894
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,3584,51200,1.2422026528252494
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,3584,8192,0.08648977677027385
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,3584,10240,0.23563289642333984
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,3584,7168,0.073761781056722
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,3584,65536,1.5851661894056532
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,3584,10240,0.3336702187856038
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,3584,8192,0.18848089377085367
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,3584,8192,0.25768089294433594
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,3584,6144,0.06377955277760823
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,3584,5120,0.05298044284184774
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,3584,7168,0.16239910655551487
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,3584,6144,0.13807643784417048
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,3584,7168,0.2240124543507894
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,3584,51200,1.5339955223931208
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,3584,6144,0.19480621814727783
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,3584,4096,0.04287733303176033
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,3584,5120,0.11689155631595188
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,3584,3584,0.038372443781958684
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,3584,5120,0.16462932692633733
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,3584,4096,0.09511644310421413
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,3584,3072,0.03380977776315477
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,3584,4096,0.13577866554260254
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,3584,2560,0.02972088919745551
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,3584,3584,0.1218071116341485
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,3584,3584,0.08491022057003444
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,3584,2048,0.024546666277779475
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,3584,3072,0.10780444410112168
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,3584,3072,0.07555199993981256
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,3584,1536,0.020023110840055678
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,3584,2560,0.06424088610543145
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,3584,12288,0.3854773309495714
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,3584,2048,0.07943911022610135
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,3584,2048,0.05171111226081848
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,3584,1024,0.01534844438234965
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,3584,768,0.011511111425028907
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,3584,1536,0.04171999957826403
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,3584,1536,0.06669955783420138
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,3584,512,0.009737778041097853
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,3584,1024,0.05018577641910977
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,3584,1024,0.031417777140935264
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,3584,768,0.04355555441644457
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,3584,768,0.02742133372359806
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,3584,256,0.0075839997993575195
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,3584,512,0.021996445126003687
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,3584,512,0.0366266667842865
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,3584,128,0.006232000059551663
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,3584,64,0.0064693333374129395
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,3584,256,0.030943112240897283
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,3584,32,0.007609777980380588
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,3584,128,0.02693333393997616
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,3584,128,0.017872000734011333
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,3584,64,0.017842666970358956
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,3584,32,0.01740533279048072
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,3584,65536,1.9572319454616969
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,3072,65536,0.5183875295850966
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,3072,51200,0.34924888610839844
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,3584,2560,0.09343022108078003
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,3072,16384,0.1337404383553399
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,3072,16384,0.3609893321990967
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,3584,256,0.018552000323931377
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,3072,12288,0.0928693347507053
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,3072,16384,0.47392087512546116
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,3072,10240,0.09479644563462998
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,3072,65536,1.477134174770779
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,3072,12288,0.26946579085456
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,3072,51200,1.1543750762939453
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,3072,12288,0.36025333404541016
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,3072,10240,0.22696889771355522
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,3072,7168,0.06162666612201267
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,3072,10240,0.30316710472106934
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,3072,8192,0.17856621742248535
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,3072,6144,0.05381066600481669
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,3072,8192,0.2395404444800483
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,3072,7168,0.15518221590254042
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,3072,65536,1.8202391730414496
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,3072,7168,0.2101644410027398
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,3072,5120,0.042632887760798134
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,3072,51200,1.4463396072387695
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,3072,6144,0.13149421744876438
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,3072,6144,0.18030667304992676
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,3072,4096,0.03506133291456435
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,3072,3584,0.03228266702757941
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,3072,5120,0.15377067195044622
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,3072,5120,0.11044800281524658
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,3072,4096,0.09115022420883179
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,3072,4096,0.12723555829789904
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,3072,3584,0.08114400174882677
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,3072,3072,0.028862221373452082
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,3072,2560,0.0244186669588089
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,3072,3584,0.11469777425130208
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,3072,2048,0.020202666521072388
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,3072,3072,0.07181244426303439
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,3072,3072,0.1009991102748447
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,3072,2560,0.060191108120812305
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,3072,2560,0.08842577536900838
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,3072,1536,0.015140444040298462
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,3072,8192,0.06912799676259358
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,3072,2048,0.048680888281928174
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,3072,1024,0.011411555939250521
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,3072,2048,0.07503644625345866
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,3072,768,0.009304888546466827
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,3072,512,0.00795377790927887
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,3072,1536,0.06236266427569919
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,3072,1024,0.04727377825313144
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,3072,1024,0.02984444300333659
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,3072,768,0.042131556404961475
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,3072,256,0.006826666494210561
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,3072,768,0.025421332981851365
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,3072,512,0.02086488902568817
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,3072,128,0.0059057776298787855
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,3072,512,0.035303112533357404
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,3072,64,0.005566222386227713
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,3072,32,0.005621333503060871
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,3072,256,0.030759112702475652
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,3072,256,0.017840888765123155
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,3072,128,0.025711110896534387
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,3072,128,0.017257778180970084
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,3072,64,0.016866667403115165
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,3072,32,0.016480889585283067
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,2560,51200,0.30733688672383624
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,2560,65536,0.4067075517442491
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,2560,16384,0.11550399992201064
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,2560,16384,0.3431511190202501
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,2560,12288,0.08443555566999648
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,3072,1536,0.03941422369745042
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,2560,16384,0.4855937957763672
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,2560,51200,1.0834781858656142
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,2560,10240,0.0722364452150133
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,2560,12288,0.2586950990888807
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,2560,8192,0.05239199929767185
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,2560,12288,0.35883733961317277
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,2560,10240,0.21494932969411215
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,2560,7168,0.0453688899676005
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,2560,10240,0.30174133512708873
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,2560,8192,0.17074844572279188
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,2560,51200,1.4189252853393555
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,2560,6144,0.03930133250024583
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,2560,8192,0.23841688368055555
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,2560,7168,0.147161775165134
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,2560,5120,0.034392890002992414
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,2560,7168,0.20872888300153944
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,2560,4096,0.029846221208572388
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,2560,6144,0.17993688583374023
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,2560,65536,1.808444341023763
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,2560,5120,0.10377689202626546
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,2560,3584,0.02479644450876448
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,2560,5120,0.15215555826822916
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,2560,3072,0.022425777382320825
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,2560,4096,0.12629600365956625
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,2560,2560,0.018568888306617737
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,2560,3584,0.07627466652128431
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,2560,3584,0.11343999703725179
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,2560,3072,0.06651822063657972
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,2560,3072,0.10074844625261094
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,2560,2560,0.05716088745329115
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,2560,65536,1.3747599919637044
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,2560,1536,0.012719111310111152
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,2560,2048,0.0461422238085005
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,2560,2048,0.07412088579601712
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,2560,1024,0.01016088906261656
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,2560,1536,0.06202310985989041
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,2560,1536,0.036673777633243136
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,2560,768,0.008302222523424361
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,2560,1024,0.0469813346862793
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,2560,1024,0.028348445892333984
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,2560,512,0.007369777394665613
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,2560,768,0.04163733455869887
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,2560,768,0.024345777100986902
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,2560,256,0.006240889016124938
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,2560,512,0.01996799972322252
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,2560,512,0.03509777784347534
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,2560,128,0.005584888988071018
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,2560,256,0.017162667380438913
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,2560,256,0.029984000656339858
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,2560,6144,0.12401866912841797
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,2560,64,0.005133333305517833
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,2560,128,0.016192000773217943
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,2560,32,0.005510222166776657
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,2560,64,0.016153777639071148
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,2560,32,0.01583377851380242
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,2560,4096,0.0858888891008165
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,2048,65536,0.3578186564975315
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,2560,2048,0.015790222419632804
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,2048,51200,0.2614915635850695
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,2560,2560,0.08744177553388809
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,2048,16384,0.3299493259853787
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,2048,12288,0.0668319993548923
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,2048,16384,0.43570489353603786
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,2560,128,0.025736888249715168
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,2048,51200,1.003369755215115
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,2048,65536,1.2827217313978407
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,2048,10240,0.05654133028454251
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,2048,12288,0.24268621868557402
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,2048,8192,0.04619288775655958
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,2048,12288,0.3322462240854899
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,2048,7168,0.03973866502443949
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,2048,10240,0.20203377140892875
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,2048,8192,0.15963910685645208
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,2048,10240,0.2792328993479411
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,2048,6144,0.03359377715322707
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,2048,8192,0.22058488263024223
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,2048,16384,0.09420266416337754
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,2048,5120,0.02941511074701945
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,2048,7168,0.13788710700141057
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,2048,7168,0.19315732849968803
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,2048,4096,0.024503111839294434
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,2048,51200,1.3276568518744576
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,2048,6144,0.166867560810513
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,2048,6144,0.11617422103881836
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,2048,5120,0.0976417793167962
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,2048,65536,1.672035535176595
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,2048,3584,0.022590221630202398
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,2048,5120,0.141485333442688
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,2048,3072,0.019518221418062847
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,2048,2560,0.017768889665603638
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,2048,4096,0.0802968872918023
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,2048,3584,0.10616533623801337
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,2048,3072,0.09399111403359307
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,2048,3072,0.06191111273235745
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,2048,2048,0.015160888433456421
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,2048,2560,0.05182400014665392
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,2048,2560,0.08170221911536323
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,2048,2048,0.06928800212012397
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,2048,1536,0.03396177623007033
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,2048,1536,0.057799114121331104
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,2048,1024,0.009370666411187913
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,2048,768,0.008294222255547842
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,2048,1024,0.04420355624622769
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,2048,1024,0.026446221603287592
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,2048,512,0.006918222126033571
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,2048,768,0.0229751103454166
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,2048,768,0.03970222340689765
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,2048,256,0.005543111099137201
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,2048,512,0.03324710991647508
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,2048,256,0.01649777756796943
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,2048,256,0.028538667493396338
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,2048,128,0.00526577772365676
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,2048,128,0.015470221638679504
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,2048,128,0.024698666400379602
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,2048,4096,0.1172800064086914
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,2048,32,0.004831111265553368
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,2048,3584,0.07135733630922106
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,2048,64,0.015271110667122735
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,2048,1536,0.011981333295504252
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,2048,32,0.01516711049609714
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,2048,2048,0.04287733303176033
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,1536,65536,0.2701217863294813
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,1536,51200,0.21326755152808297
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,1536,16384,0.07526222202512953
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,2048,512,0.018811555372344125
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,1536,16384,0.3193262153201633
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,1536,12288,0.05247199866506788
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,2048,64,0.004860444615284602
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,1536,51200,0.9409981833563911
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,1536,16384,0.432968881395128
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,1536,65536,1.1986018286810982
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,1536,10240,0.04658933480580648
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,1536,12288,0.23381333880954316
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,1536,8192,0.03943822118971083
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,1536,12288,0.33009065522087944
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,1536,10240,0.1934195492002699
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,1536,8192,0.15309154987335205
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,1536,10240,0.27769867579142254
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,1536,8192,0.219559113184611
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,1536,51200,1.3036817974514432
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,1536,6144,0.0281333327293396
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,1536,5120,0.024138665861553613
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,1536,7168,0.131239997016059
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,1536,7168,0.1920106675889757
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,1536,65536,1.664290640089247
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,1536,6144,0.11096266905466716
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,1536,6144,0.16496445073021784
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,1536,5120,0.09297866953743829
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,1536,3584,0.018388445178667705
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,1536,5120,0.14006666342417398
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,1536,3072,0.016318221886952717
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,1536,4096,0.07620622052086724
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,1536,4096,0.11629777484469944
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,1536,2560,0.01441422270403968
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,1536,3584,0.06776889165242513
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,1536,3584,0.1049928863843282
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,1536,2048,0.012152888708644442
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,1536,3072,0.059079110622406006
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,1536,3072,0.09272178014119466
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,1536,1536,0.009466666314336989
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,1536,2560,0.0813902219136556
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,1536,1024,0.007833778030342525
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,1536,2048,0.06856889194912381
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,1536,2048,0.04018488857481215
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,1536,768,0.0069208890199661255
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,1536,1536,0.03263288736343384
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,1536,1536,0.056596444712744824
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,1536,512,0.00589155571328269
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,1536,1024,0.043741332160102
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,1536,1024,0.025356445047590468
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,1536,256,0.004807999978462855
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,1536,768,0.03908088803291321
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,1536,7168,0.03198755449718899
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,1536,512,0.03360266817940606
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,1536,128,0.004554666578769684
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,1536,256,0.028480887413024902
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,1536,64,0.0041911109454101985
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,1536,128,0.01465777721669939
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,1536,128,0.02405511173937056
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,1536,32,0.00423555572827657
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,1536,64,0.014391111003028022
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,1536,32,0.014104889498816596
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,1024,65536,0.18335110611385771
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,1024,51200,0.13302666611141628
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,1536,2560,0.04907288816240099
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,1536,768,0.02198133369286855
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,1024,16384,0.048579557074440845
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,1536,256,0.015522667103343539
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,1024,65536,1.1064213646782768
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,1024,51200,0.8665493329366049
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,1024,12288,0.0380711125002967
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,1536,4096,0.020845333735148113
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,1024,16384,0.2853048907385932
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,1024,10240,0.02980533242225647
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,1024,16384,0.39652087953355575
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,1024,12288,0.21636444992489287
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,1024,8192,0.025645333859655593
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,1024,12288,0.302602661980523
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,1024,65536,1.518687989976671
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,1024,7168,0.022498667240142822
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,1024,51200,1.1947751575046115
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,1024,10240,0.2549582322438558
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,1024,6144,0.019896000623703003
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,1024,8192,0.14245866404639349
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,1024,8192,0.20158044497172037
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,1024,5120,0.01715377800994449
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,1024,7168,0.12261866198645698
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,1024,7168,0.17637956142425537
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,1024,6144,0.10327466991212632
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,1024,4096,0.014740443891949125
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,1024,6144,0.1518239974975586
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,1024,3584,0.013583111266295115
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,1024,5120,0.0856328871515062
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,1024,5120,0.1284897724787394
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,1024,3072,0.011749332977665795
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,1024,4096,0.10734844207763672
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,1024,4096,0.07038488652971056
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,1024,2560,0.010378667049937779
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,1024,3584,0.09648888640933567
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,1024,3072,0.05372977919048733
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,1024,3072,0.0851831105020311
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,1024,2048,0.009026666482289633
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,1024,2560,0.04521955715285408
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,1024,1536,0.007272000114123027
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,1024,2048,0.03733777668741014
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,1024,2048,0.06305955515967475
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,1024,1024,0.00629688882165485
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,1024,10240,0.18023378319210479
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,1024,1536,0.030368887715869482
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,1024,768,0.005260444349712796
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,1024,1024,0.023751111494170293
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,1024,1024,0.040844443771574236
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,1024,768,0.020582222276263766
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,1024,768,0.036672890186309814
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,1024,512,0.016978666186332703
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,1024,512,0.03156177865134345
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,1536,512,0.017856000198258292
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,1024,256,0.0041884444653987885
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,1024,128,0.0038888889054457345
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,1024,256,0.026689777771631878
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,1024,256,0.014495111174053617
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,1024,64,0.003504000190231535
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,1024,128,0.013771555489963956
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,1024,3584,0.06243377923965454
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,1024,32,0.003559999995761447
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,1024,128,0.023065777288542852
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,1024,64,0.013415999710559845
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,768,65536,0.15607110659281412
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,1024,32,0.013414222333166333
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,1024,2560,0.0748257769478692
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,768,51200,0.11790843804677327
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,768,16384,0.03882666760020786
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,1024,1536,0.052101333936055504
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,1024,512,0.004767111192146937
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,768,16384,0.27641601032680935
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,768,12288,0.03072355522049798
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,768,16384,0.39600621329413516
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,768,10240,0.025405334101782903
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,768,51200,0.8353875478108724
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,768,12288,0.20879733562469482
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,768,65536,1.0658160315619576
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,768,8192,0.01994044416480594
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,768,12288,0.30166400803460014
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,768,7168,0.018551111221313477
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,768,10240,0.1742968824174669
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,768,6144,0.016521778371598985
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,768,10240,0.25398490164015025
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,768,8192,0.13670044475131565
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,768,8192,0.20050044854482016
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,768,51200,1.1895804935031467
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,768,7168,0.11752000119951035
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,768,5120,0.014119111829333834
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,768,4096,0.012171555724408893
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,768,7168,0.17547289530436197
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,768,3584,0.011021333436171213
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,768,6144,0.09889866908391316
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,768,6144,0.1508115530014038
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,768,5120,0.08280355400509305
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,768,5120,0.12842044565412733
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,768,4096,0.06753066513273451
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,768,3072,0.010040000081062317
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,768,4096,0.10725955830679999
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,768,2560,0.008978666530715095
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,768,2048,0.007956444389290279
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,768,3584,0.05974400043487549
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,768,3584,0.09649866819381714
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,768,3072,0.08480533626344468
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,768,2560,0.043495999442206494
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,768,2560,0.07469422287411161
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,768,1024,0.005922666854328579
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,768,2048,0.06136800183190239
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,768,1536,0.02882400155067444
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,768,1024,0.022974222898483276
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,768,768,0.004879111217127906
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,768,1024,0.040347556273142494
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,768,768,0.020025778147909377
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,768,512,0.004226666771703296
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,768,512,0.016494222813182406
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,768,512,0.03121333320935567
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,768,65536,1.5138915379842122
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,768,256,0.004558222161398994
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,768,256,0.026722666290071275
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,768,256,0.014095111025704278
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,768,3072,0.0511795547273424
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,768,128,0.003887999802827835
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,768,64,0.0038417776425679526
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,768,1536,0.051755554146236844
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,768,128,0.013184000220563678
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,768,32,0.0038924444880750445
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,768,64,0.013077333569526672
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,512,65536,0.1130711105134752
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,768,32,0.012802666260136498
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,768,768,0.03618933426009284
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,512,51200,0.0894506639904446
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,768,1536,0.006635555376609166
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,512,16384,0.034703999757766724
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,768,2048,0.03527644607755873
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,512,65536,1.0235413445366752
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,512,51200,0.8029475741916232
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,512,12288,0.025217778152889673
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,768,128,0.022690667046440974
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,512,10240,0.020711110697852243
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,512,16384,0.2660551071166992
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,512,12288,0.20067911677890352
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,512,8192,0.017830222845077515
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,512,51200,1.1769288380940754
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,512,16384,0.39154577255249023
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,512,10240,0.16735466321309408
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,512,7168,0.015844444433848064
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,512,65536,1.5005999671088324
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,512,10240,0.25291289223564994
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,512,8192,0.13174045085906982
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,512,6144,0.014118222726715935
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,512,8192,0.19894133673773873
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,512,7168,0.11278400156233047
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,512,5120,0.01237422227859497
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,512,4096,0.010461333725187512
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,512,7168,0.1737377776039971
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,512,6144,0.09497155745824178
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,512,3584,0.009992000129487779
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,512,6144,0.14993600050608316
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,512,5120,0.07938844627804227
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,512,3072,0.008976000050703684
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,512,4096,0.06468266910976835
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,512,4096,0.10623021920522054
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,512,2560,0.008221333225568136
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,512,3584,0.0950160026550293
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,512,3584,0.057757331265343555
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,512,2048,0.007249777515729268
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,512,3072,0.08385333087709214
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,512,1536,0.006225777582989798
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,512,2560,0.04176177912288242
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,512,2048,0.062090668413374156
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,512,2048,0.0342497792508867
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,512,1024,0.005232000102599462
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,512,1536,0.02813777658674452
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,512,1536,0.051426665650473706
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,512,768,0.004610666798220741
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,512,1024,0.022348443667093914
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,512,1024,0.040418667925728693
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,512,512,0.004214222232500712
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,512,12288,0.29900532298617893
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,512,768,0.03635111120012071
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,512,256,0.0035422220826148987
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,512,512,0.016158221496476066
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,512,512,0.031207998593648274
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,512,128,0.003491555651028951
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,512,256,0.013462222284740873
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,512,256,0.026752889156341553
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,512,64,0.0031537777847713898
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,512,32,0.0031511110977994073
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,512,128,0.022302221920755174
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,512,128,0.013074666261672974
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,512,64,0.0127697777416971
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,256,65536,0.06376266479492188
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,512,32,0.012372444073359171
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,256,51200,0.05204000075658163
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,512,5120,0.12816266218821207
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,256,16384,0.01869066721863217
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,512,3072,0.04902844296561348
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,512,2560,0.07414399915271334
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,256,12288,0.01794488893614875
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,256,16384,0.25439733929104275
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,256,16384,0.3903208838568793
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,256,12288,0.19248888227674696
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,512,768,0.019235556324323017
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,256,51200,0.7665777736239963
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,256,10240,0.016519111063745286
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,256,8192,0.013787555197874704
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,256,12288,0.2971431149376763
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,256,65536,0.9778799480862088
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,256,7168,0.012471111284361945
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,256,10240,0.16077066792382136
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,256,8192,0.1268426709704929
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,256,10240,0.25122398800320095
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,256,8192,0.1981511116027832
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,256,6144,0.011119999819331698
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,256,5120,0.009655999640623728
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,256,7168,0.10803021987279256
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,256,51200,1.1734204822116427
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,256,4096,0.008640000389681922
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,256,7168,0.1736755503548516
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,256,6144,0.09029422203699748
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,256,6144,0.1495680014292399
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,256,3584,0.007996444072988298
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,256,5120,0.1272239949968126
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,256,65536,1.4904836018880208
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,256,3072,0.007055111229419708
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,256,4096,0.061627553568945996
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,256,4096,0.10536799828211467
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,256,2560,0.006632888896597757
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,256,3584,0.05346222387419807
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,256,3584,0.09480000204510158
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,256,3072,0.04669600062900119
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,256,2048,0.005653333332803514
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,256,3072,0.08379377921422322
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,256,1536,0.004873777843183941
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,256,2560,0.03981066743532816
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,256,2560,0.0720648898018731
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,256,1024,0.0041831110914548235
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,256,2048,0.03226577904489305
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,256,2048,0.060600890053643115
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,256,768,0.003948444293604957
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,256,1536,0.027149332894219294
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,256,512,0.0038382220599386427
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,256,1024,0.02160533269246419
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,256,1024,0.04042933384577433
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,256,768,0.018791110979186166
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,256,512,0.015525332755512662
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,256,512,0.030142221185896132
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,256,128,0.003148444410827425
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,256,256,0.01311466677321328
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,256,256,0.026504000027974445
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,256,64,0.0028488888508743713
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,256,128,0.022270222504933674
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,256,32,0.002875555513633622
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,256,64,0.012415111064910889
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,256,5120,0.07594399982028537
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,256,32,0.012099555797047086
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,128,65536,0.05308533377117581
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,128,51200,0.04364711046218872
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,256,1536,0.050999999046325684
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,256,256,0.003391111062632667
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,128,16384,0.01312622262371911
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,128,51200,0.7659520043267144
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,256,128,0.01239822225438224
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,128,16384,0.25371821721394855
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,128,12288,0.014142221874660917
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,128,16384,0.3890364434983995
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,128,10240,0.012448888685968188
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,128,12288,0.2969244321187337
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,128,65536,1.4866417778862848
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,128,8192,0.012949333422713809
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,128,51200,1.1686666276719835
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,128,10240,0.16044710742102727
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,128,7168,0.01182577759027481
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,128,10240,0.25093865394592285
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,128,8192,0.12514489226871067
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,256,768,0.03565066721704271
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,128,6144,0.010444444086816577
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,128,8192,0.19786666499243843
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,128,7168,0.10733689202202691
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,128,7168,0.17343200577629936
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,128,6144,0.08989510933558147
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,128,6144,0.14908977349599203
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,128,4096,0.007994666695594788
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,128,65536,0.9787635803222656
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,128,5120,0.0753564437230428
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,128,3584,0.007592889169851939
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,128,5120,0.12640978230370417
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,128,4096,0.061271111170450844
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,128,3072,0.006631111105283101
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,128,4096,0.10492000314924453
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,128,2560,0.006234666539563074
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,128,3584,0.09430133634143406
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,128,3072,0.04449333416091072
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,128,3072,0.08354044622845119
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,128,12288,0.19226222568088105
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,128,2560,0.03907910982767741
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,128,2560,0.07253511084450616
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,128,2048,0.03236177894804213
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,128,2048,0.060191108120812305
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,128,1536,0.026741334133678015
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,128,1536,0.05072089036305746
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,128,768,0.0038968887594011095
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,128,1024,0.021307556165589228
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,128,1024,0.039833777480655246
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,128,512,0.003506666670242945
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,128,768,0.018596443865034316
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,128,768,0.03561155663596259
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,128,512,0.015122666954994202
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,128,5120,0.009357333183288574
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,128,256,0.012663111090660095
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,128,256,0.02539377742343479
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,128,128,0.002871111035346985
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,128,3584,0.05359111229578654
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,128,2048,0.005557333429654439
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,128,128,0.012087999946541257
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,128,1536,0.004875555634498596
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,128,32,0.0028862222615215513
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,128,1024,0.0042444442709287005
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,128,32,0.011770666473441653
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,64,65536,0.048998223410712353
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,64,51200,0.03996710975964864
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,128,512,0.03017510970433553
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,128,256,0.003228444399105178
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,64,16384,0.01517777807182736
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,64,12288,0.012785777449607849
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,64,16384,0.2535128858354357
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,64,12288,0.19223644998338488
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,64,10240,0.011369778050316704
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,64,51200,0.765974203745524
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,128,64,0.0028764444092909494
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,64,65536,0.9760328928629557
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,64,7168,0.009312888814343346
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,64,10240,0.1602533393436008
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,64,6144,0.008976000050703684
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,128,64,0.011924444801277585
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,64,8192,0.12514577971564397
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,64,5120,0.008303110798199972
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,64,4096,0.007794666621420119
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,64,7168,0.1072302195760939
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,64,3584,0.0069297779765393995
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,64,6144,0.08979555633332993
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,64,3072,0.006589333216349284
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,64,5120,0.0749866697523329
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,64,2560,0.005912000106440649
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,64,4096,0.06114666991763645
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,64,2048,0.005202666752868229
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,64,1536,0.004879999905824661
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,64,3584,0.05335644549793667
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,64,3072,0.04587733414438036
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,64,1024,0.0038515557017591265
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,64,2560,0.038330667548709445
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,64,768,0.0038906666967603895
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,64,2048,0.032249778509140015
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,64,512,0.0032115555885765287
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,64,1536,0.026749332745869953
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,64,256,0.0031991110493739447
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,64,128,0.0031582222630580268
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,64,1024,0.02125777800877889
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,64,768,0.018223999275101554
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,64,512,0.01517955627706316
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,64,256,0.012784000072214337
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,64,32,0.00286311118139161
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,64,128,0.012078222301271228
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,32,65536,0.047934220896826855
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,64,64,0.011749332977665795
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,32,51200,0.03785066803296407
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,64,32,0.011701333026091257
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,32,16384,0.00999644481473499
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,64,8192,0.0099982221921285
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,32,12288,0.009013333254390294
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,32,10240,0.00795555528667238
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,32,16384,0.2537439929114448
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,32,12288,0.19182311164008248
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,32,10240,0.1601919995413886
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,32,8192,0.012673777838548025
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,32,7168,0.011400889191362592
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,32,6144,0.010471111370457543
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,32,5120,0.009370666411187913
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,32,8192,0.12514221668243408
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,32,7168,0.10767289002736409
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,32,51200,0.7655297915140787
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,32,5120,0.07525244686338636
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,32,3584,0.00832444429397583
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,32,3072,0.006577777779764599
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,32,4096,0.06169866853290134
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,32,2560,0.005897777775923411
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,64,64,0.0028284444577164124
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,32,3584,0.053575111760033496
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,32,2048,0.00527022240890397
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,32,3072,0.045034666856129967
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,32,1536,0.004581333448489507
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,32,1024,0.0038977778620190094
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,32,2560,0.03879022267129686
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,32,768,0.0034924443397257063
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,32,2048,0.032257778777016535
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,32,1536,0.026438222991095647
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,32,512,0.003504000190231535
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,32,1024,0.021272889441914026
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,32,256,0.0028702221396896574
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,32,128,0.002793777734041214
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,32,768,0.018544000056054857
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,32,64,0.00253866674999396
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,32,512,0.015125332607163323
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,32,256,0.01274577776590983
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,32,32,0.0028088889602157804
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,32,128,0.011957333319716983
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,32,64,0.011754666765530905
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,32,32,0.011702222128709158
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,32,6144,0.08984266387091742
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2048,32,65536,0.9762747022840711
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2048,32,4096,0.009025777379671732
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,65536,12288,1.719397332933214
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,65536,16384,2.2984720865885415
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,65536,16384,2.785881678263346
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,65536,10240,1.4239582485622828
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,65536,12288,1.9940728081597223
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,65536,10240,1.621206177605523
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,65536,8192,1.144004397922092
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,65536,7168,0.9719226625230578
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,65536,7168,1.1057582431369357
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,65536,6144,0.9169271257188586
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,65536,8192,1.2557857301500108
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,65536,5120,0.7567777633666992
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,65536,6144,0.9620052973429362
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,65536,4096,0.6723093456692166
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,65536,4096,0.6181999842325846
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,65536,5120,0.7926266458299426
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,65536,3584,0.49624888102213544
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,65536,3584,0.5442097981770834
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,65536,3072,0.4898968802558051
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,65536,2560,0.3992871178521051
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,65536,2048,0.31113510661655003
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,65536,3072,0.4652213520473904
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,65536,2560,0.42510400878058535
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,65536,1536,0.27888621224297416
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,65536,1024,0.15681866804758707
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,65536,1536,0.3054515520731608
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,65536,2048,0.40156088935004336
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,65536,768,0.15665777524312338
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,65536,51200,7.3121838039822045
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,65536,768,0.158768892288208
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,65536,1024,0.19999821980794272
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,65536,128,0.05809511078728569
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,65536,512,0.1568791071573893
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,65536,64,0.05320355627271864
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,65536,128,0.11390222443474664
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,65536,32,0.056220445368025035
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,65536,256,0.12797778182559544
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,65536,32,0.11461599667867024
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,65536,512,0.1024693316883511
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,65536,64,0.11430933740403916
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,65536,256,0.08698666758007473
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,65536,51200,10.673706902398003
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,51200,16384,1.8351323869493272
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,51200,12288,1.3914338217841253
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,51200,16384,2.240296893649631
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,51200,12288,1.5669270621405706
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,51200,10240,1.1460897657606337
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,51200,51200,5.5635732014973955
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,51200,10240,1.3035048378838432
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,51200,8192,0.9017546971638998
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,51200,7168,0.8175146844651965
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,51200,6144,0.7046720186869303
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,51200,8192,1.0259715186225045
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,51200,7168,0.8746497895982531
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,51200,65536,7.261179606119792
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,51200,5120,0.5782871246337891
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,51200,4096,0.47492890887790257
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,51200,5120,0.6195182270473903
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,51200,6144,0.7670888900756836
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,51200,3584,0.41725956069098574
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,51200,3072,0.32311466005113393
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,51200,3584,0.48373688591851133
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,51200,4096,0.5091386901007758
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,51200,2560,0.2930186589558919
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,51200,3072,0.37505600187513566
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,51200,2048,0.23773333761427137
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,51200,2048,0.26345600022210014
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,51200,1536,0.18441689014434814
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,51200,1024,0.11543733543819851
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,51200,768,0.09082311391830444
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,51200,1536,0.20836088392469618
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,51200,512,0.07940622170766194
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,51200,1024,0.15810044606526694
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,51200,768,0.13656889067755804
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,51200,256,0.05799555778503418
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,51200,128,0.04918755425347222
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,51200,64,0.04282222191492716
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,51200,256,0.09684889184104072
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,51200,128,0.09444889095094468
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,51200,51200,8.374671936035156
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,51200,32,0.04184000028504265
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,51200,64,0.09349244170718723
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,51200,32,0.09378133217493693
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,51200,2560,0.33452712164984805
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,51200,512,0.1089093354013231
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,2048,128,128,0.022321777211295232
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,16384,16384,0.5479777654012045
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,16384,12288,0.4507128927442763
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,16384,16384,0.813255098130968
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,16384,51200,1.9399030473497179
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,16384,10240,0.37454133563571507
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,16384,12288,0.6052248742845323
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,51200,65536,11.269139607747396
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,16384,8192,0.29751822683546275
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,16384,7168,0.2506337695651584
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,16384,10240,0.4936061965094672
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,16384,6144,0.22248623106214735
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,16384,65536,2.5757289462619357
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,16384,7168,0.35866133371988934
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,16384,8192,0.4975546730889215
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,16384,4096,0.1483902268939548
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,16384,5120,0.20087733533647326
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,16384,6144,0.3083884451124403
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,16384,3584,0.13350044356452093
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,16384,4096,0.21435911125606963
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,16384,3072,0.10906489027871026
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,16384,5120,0.26209955745273167
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,16384,2560,0.09617066383361816
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,16384,51200,2.7857413821750217
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,16384,1536,0.05938488907284207
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,16384,2560,0.1361831161710951
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,16384,2048,0.07459821965959337
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,16384,1024,0.04204533497492472
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,16384,2048,0.10886844661500718
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,16384,768,0.03198400139808655
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,16384,512,0.023952888117896184
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,16384,1536,0.08784444464577569
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,16384,1024,0.06772889031304254
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,16384,256,0.01958933307064904
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,16384,768,0.054683556159337364
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,16384,128,0.015848888291252982
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,16384,512,0.044313778479894005
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,16384,64,0.013453333742088742
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,16384,256,0.039232889811197914
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,16384,32,0.013929777675204806
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,16384,128,0.03599288728502061
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,16384,64,0.03572444452179803
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,16384,32,0.03563200102912055
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,16384,3584,0.18272711171044242
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,16384,3072,0.17416711648305258
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,16384,65536,3.5756624009874134
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,12288,16384,0.45664532979329425
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,12288,51200,1.3545804553561742
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,12288,12288,0.32283910115559894
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,12288,16384,0.6546684371100532
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,12288,65536,1.837368859185113
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,12288,10240,0.2962426609463162
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,12288,12288,0.5040559768676758
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,12288,8192,0.23941156599256727
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,12288,10240,0.39681598875257706
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,12288,7168,0.21260089344448516
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,12288,6144,0.16851645045810273
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,12288,7168,0.2780595620473226
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,12288,8192,0.33602134386698407
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,12288,5120,0.15128889348771837
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,12288,4096,0.11911022663116455
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,12288,6144,0.23445333374871147
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,12288,3584,0.11088089148203532
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,12288,5120,0.22175378269619414
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,12288,3072,0.08279911014768812
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,12288,51200,2.363220426771376
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,12288,4096,0.16320889525943333
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,12288,2560,0.07890488704045613
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,12288,2048,0.06338222159279717
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,12288,1536,0.04796088735262553
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,12288,3072,0.13747466935051814
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,12288,1024,0.03529955612288581
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,12288,2560,0.10697866810692681
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,12288,768,0.02721422248416477
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,12288,512,0.020408888657887776
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,12288,2048,0.09136533074908787
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,12288,1536,0.07455022467507257
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,12288,256,0.015876443849669564
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,12288,1024,0.055939555168151855
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,12288,65536,3.0023519727918835
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,12288,128,0.012758221891191272
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,12288,64,0.011392888923486074
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,12288,768,0.04542666673660278
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,12288,256,0.031253334548738264
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,12288,128,0.029695110188590154
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,12288,64,0.031545778115590416
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,12288,32,0.030198223061031763
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,10240,16384,0.3880328867170546
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,12288,3584,0.14203288820054796
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,10240,12288,0.2991368770599365
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,12288,512,0.037392000357309975
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,12288,32,0.011695110963450538
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,10240,51200,1.2263724009195964
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,10240,16384,0.6066213183932835
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,10240,10240,0.2511253356933594
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,10240,65536,1.558151986863878
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,10240,8192,0.22721600532531738
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,10240,10240,0.3541128900316026
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,10240,12288,0.4299208852979872
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,10240,6144,0.15603910552130804
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,10240,5120,0.12503200107150608
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,10240,7168,0.2602506743537055
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,10240,4096,0.1017635530895657
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,10240,6144,0.208040886455112
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,10240,5120,0.18986044989691842
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,10240,51200,1.953012466430664
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,10240,3072,0.07657511366738214
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,10240,4096,0.14424355824788412
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,10240,3584,0.12619733810424805
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,10240,2560,0.06356355879041883
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,10240,2048,0.051375110944112144
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,10240,65536,2.483496983846029
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,10240,2560,0.09770399994320339
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,10240,2048,0.08118044667773776
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,10240,1536,0.04100622071160211
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,10240,1024,0.028986665937635634
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,10240,768,0.02353333267900679
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,10240,1536,0.06487022505866157
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,10240,1024,0.048455999957190625
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,10240,512,0.017144888639450073
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,10240,256,0.015776000089115567
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,10240,768,0.04111288984616598
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,10240,7168,0.1651208930545383
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,10240,128,0.011016888750924004
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,10240,64,0.009690666364298927
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,10240,512,0.032927112446890935
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,10240,256,0.028205331828859117
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,10240,32,0.00999644481473499
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,10240,64,0.02678844498263465
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,10240,32,0.02643644478585985
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,10240,3584,0.08806844552357991
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,10240,3072,0.11420267158084446
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,8192,16384,0.276417785220676
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,8192,51200,0.8122640185885959
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,10240,8192,0.28040888574388295
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,8192,65536,1.146034664577908
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,10240,128,0.026836444934209187
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,8192,12288,0.23047288258870444
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,8192,10240,0.19745243920220268
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,8192,16384,0.5122115347120497
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,8192,8192,0.15042666594187418
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,8192,12288,0.371872001224094
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,8192,7168,0.11342310905456543
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,8192,10240,0.3098222149742974
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,8192,6144,0.10849955346849229
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,8192,8192,0.30042489369710285
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,8192,5120,0.09240800142288208
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,8192,7168,0.23768888579474556
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,8192,4096,0.08527911371654934
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,8192,6144,0.18450933032565645
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,8192,3584,0.070214225186242
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,8192,5120,0.15472977691226536
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,8192,51200,1.7320480346679688
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,8192,3072,0.053447110785378345
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,8192,2560,0.048162665632036
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,8192,2048,0.03878755701912774
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,8192,1536,0.03170399864514669
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,8192,3584,0.12292710940043132
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,8192,3072,0.10071111387676662
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,8192,2560,0.08563466866811116
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,8192,1024,0.026644445127911035
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,8192,65536,2.196909374660916
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,8192,2048,0.07057688633600871
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,8192,512,0.014545778433481852
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,8192,1536,0.0566435522503323
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,8192,1024,0.043397333886888295
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,8192,256,0.014641778336630927
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,8192,128,0.009240888886981541
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,8192,64,0.00811644477976693
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,8192,256,0.024712888730896845
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,8192,32,0.008376888930797577
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,8192,128,0.023950222465727065
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,8192,64,0.02404088940885332
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,8192,32,0.02372088862790002
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,8192,4096,0.12373156017727321
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,8192,768,0.01924711134698656
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,7168,65536,0.9395066367255317
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,8192,768,0.03731377919514974
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,7168,51200,0.8856417867872449
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,8192,512,0.028743111424975928
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,7168,12288,0.20946133136749268
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,7168,10240,0.19345066282484266
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,7168,8192,0.14240622520446777
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,7168,16384,0.4688177638583713
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,7168,12288,0.3458586798773871
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,7168,10240,0.2865528795454237
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,7168,7168,0.12028533882564968
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,7168,6144,0.1126684480243259
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,7168,8192,0.2633511225382487
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,7168,5120,0.09781689114040798
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,7168,7168,0.19671644104851616
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,7168,4096,0.07268000311321683
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,7168,6144,0.16811911265055338
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,7168,3584,0.06335200203789605
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,7168,51200,1.5700462129380968
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,7168,3072,0.05450755688879225
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,7168,5120,0.14509777228037515
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,7168,2560,0.049003554715050586
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,7168,2048,0.036551998721228704
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,7168,4096,0.11903822422027588
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,7168,3584,0.10631466574139065
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,7168,1536,0.02858577834235297
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,7168,3072,0.09109510978062947
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,7168,65536,1.9691698286268446
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,7168,2560,0.07842222187254164
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,7168,768,0.017440888616773818
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,7168,512,0.013570666313171387
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,7168,2048,0.0663999981350369
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,7168,256,0.00999644481473499
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,7168,1536,0.053704000181621976
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,7168,128,0.008972444468074376
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,7168,768,0.034641779131359525
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,7168,512,0.02683999968899621
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,7168,256,0.0237128883600235
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,7168,64,0.008968888885445064
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,7168,128,0.022692445251676772
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,7168,32,0.009357333183288574
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,7168,64,0.022304000125990972
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,7168,32,0.022294221652878657
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,7168,1024,0.021425777011447485
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,6144,51200,0.7939653396606445
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,7168,16384,0.24844800101386177
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,6144,65536,1.0117226706610787
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,7168,1024,0.04055288765165541
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,6144,16384,0.22441776593526205
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,6144,12288,0.15185156133439806
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,6144,10240,0.15323289235432944
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,6144,8192,0.11197243796454535
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,6144,16384,0.4452346695794
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,6144,7168,0.09905422396130031
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,6144,12288,0.3366995652516683
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,6144,10240,0.29711821344163686
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,6144,8192,0.20784444279140898
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,6144,6144,0.09017155567804973
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,6144,51200,1.412151124742296
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,6144,5120,0.07837600178188749
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,6144,4096,0.0606551104121738
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,6144,3584,0.054670221275753446
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,6144,7168,0.1829733318752713
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,6144,6144,0.15889155864715576
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,6144,5120,0.13095555040571424
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,6144,3072,0.04818755719396803
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,6144,65536,1.8415217929416234
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,6144,2560,0.04109777675734626
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,6144,4096,0.10630933443705241
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,6144,2048,0.03428533342149522
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,6144,3584,0.09475555684831406
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,6144,1024,0.01804266704453362
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,6144,3072,0.08291466368569268
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,6144,768,0.014742222097184924
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,6144,2560,0.07282488875918917
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,6144,512,0.012168000141779581
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,6144,256,0.0092284447617001
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,6144,1536,0.04857422245873345
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,6144,1024,0.03626311156484816
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,6144,768,0.03118488854832119
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,6144,128,0.008291555775536431
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,6144,512,0.025314667158656653
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,6144,64,0.007359111474619971
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,6144,256,0.022553778356975977
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,6144,32,0.007553777760929531
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,6144,128,0.021019554800457422
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,6144,64,0.020968000094095867
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,6144,32,0.020601777566803824
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,5120,16384,0.19302133719126383
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,5120,51200,0.5519582430521647
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,5120,65536,0.7838524182637533
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,5120,12288,0.14850310484568277
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,5120,16384,0.39571200476752383
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,5120,10240,0.11599644025166829
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,6144,2048,0.06163644128375583
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,5120,8192,0.09324889050589667
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,5120,10240,0.2445111009809706
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,5120,12288,0.3484933376312256
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,5120,7168,0.0867040024863349
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,5120,8192,0.18997511598798963
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,5120,51200,1.2798177931043837
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,5120,5120,0.061384002367655434
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,5120,7168,0.16605510976579455
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,5120,4096,0.04901599884033203
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,5120,6144,0.15210044384002686
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,5120,3584,0.04315822323163351
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,5120,3072,0.03951199849446615
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,5120,5120,0.11974310874938965
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,5120,65536,1.6286897659301758
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,5120,2560,0.034429334931903414
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,5120,4096,0.09769777456919353
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,5120,2048,0.026524444421132404
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,5120,1536,0.02124711043304867
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,5120,1024,0.016050666570663452
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,5120,3072,0.07558133204778035
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,5120,2560,0.06417422162161933
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,5120,768,0.013176889055305056
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,5120,2048,0.05884177817238701
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,5120,512,0.010239111052619087
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,5120,1536,0.04493155413203769
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,5120,256,0.008683555656009251
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,5120,1024,0.033366223176320396
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,5120,128,0.0069848886794514125
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,5120,768,0.029094222519132826
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,5120,512,0.02313511073589325
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,6144,1536,0.026921777261628047
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,5120,256,0.02029511166943444
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,5120,32,0.006578666468461354
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,5120,128,0.019559999306996662
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,5120,64,0.01923733287387424
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,5120,32,0.018925334016482036
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,4096,16384,0.14002754953172472
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,5120,6144,0.08345066838794285
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,4096,51200,0.3958204322391086
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,4096,65536,0.5068195660909017
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,4096,12288,0.11160355144076878
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,4096,10240,0.09114488628175522
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,4096,16384,0.3567066722446018
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,5120,3584,0.0872853332095676
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,4096,12288,0.27740711636013454
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,4096,8192,0.07207910882102118
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,4096,7168,0.06458844741185506
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,4096,10240,0.22066133552127412
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,4096,8192,0.1723813348346286
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,4096,7168,0.15082400374942356
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,4096,5120,0.0454728901386261
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,4096,51200,1.1483430862426758
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,4096,6144,0.12948800457848444
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,4096,3584,0.03465777635574341
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,4096,5120,0.10970489184061687
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,4096,3072,0.02937777837117513
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,4096,65536,1.4843644036187067
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,4096,4096,0.08944177627563477
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,4096,2560,0.025681777132882014
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,4096,3584,0.07956355810165405
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,4096,2048,0.021692444880803425
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,4096,1536,0.018061333232455783
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,4096,3072,0.07059999969270495
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,4096,2560,0.06054666969511244
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,4096,1024,0.013974222871992322
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,4096,768,0.011418666276666852
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,4096,2048,0.04962044292026096
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,4096,1536,0.040545778142081365
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,4096,1024,0.03088888857099745
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,4096,768,0.026142223013771906
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,4096,256,0.008047111332416534
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,4096,128,0.005893333504597346
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,4096,512,0.021287999219364587
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,4096,64,0.0052720002002186244
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,4096,256,0.018552000323931377
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,4096,32,0.005560889012283749
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,4096,128,0.017960889471901786
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,4096,64,0.01789688898457421
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,5120,64,0.0064177778032090925
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,4096,32,0.01756622228357527
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,4096,4096,0.03915822174814012
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,3584,16384,0.12572267320421007
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,3584,65536,0.513985792795817
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,3584,51200,0.3988160027398004
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,3584,12288,0.10456533564461602
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,3584,10240,0.09545599752002293
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,3584,16384,0.33805688222249347
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,4096,512,0.009335999687512716
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,3584,12288,0.2661831114027235
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,3584,8192,0.06765511300828722
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,3584,7168,0.05827999777264065
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,3584,6144,0.052849776215023465
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,3584,10240,0.24306845664978027
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,3584,7168,0.14238754908243814
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,3584,5120,0.0449022220240699
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,3584,51200,1.0910524792141385
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,3584,4096,0.03584622343381246
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,3584,6144,0.12451288435194229
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,3584,3584,0.030863109562132094
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,3584,3072,0.02693422304259406
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,3584,65536,1.395507600572374
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,3584,4096,0.08859911229875352
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,3584,2560,0.02351288828584883
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,3584,3584,0.07698044512006971
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,3584,2048,0.0196426659822464
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,3584,1536,0.01629866659641266
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,3584,3072,0.06647466950946383
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,3584,1024,0.012111999922328524
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,3584,2560,0.058224002520243325
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,3584,2048,0.047304888566335045
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,3584,768,0.010710222025712332
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,3584,512,0.008225777910815345
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,3584,1536,0.03855822152561612
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,3584,1024,0.028844445943832397
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,3584,128,0.0058959999846087555
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,3584,768,0.025615110993385315
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,3584,512,0.02070577773782942
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,3584,256,0.01789155602455139
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,3584,64,0.005892444401979446
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,3584,32,0.006251555350091722
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,3584,128,0.017177777157889474
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,3584,64,0.01716800034046173
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,3584,32,0.016827555166350473
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,3584,8192,0.16428621610005698
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,4096,6144,0.05519733495182461
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,3072,16384,0.10971999830669826
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,3072,12288,0.08351288901435004
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,3072,51200,0.38603467411465114
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,3072,65536,0.49012798733181423
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,3584,5120,0.10390222072601318
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,3072,10240,0.0802346666653951
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,3072,8192,0.058784888850318066
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,3072,16384,0.32064800792270237
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,3072,7168,0.054894222153557666
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,3072,6144,0.045066667927636035
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,3072,12288,0.2408426602681478
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,3072,10240,0.2006160020828247
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,3072,8192,0.16013244787851968
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,3072,4096,0.032051556640201144
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,3072,7168,0.13639911015828451
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,3584,256,0.006702222343948152
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,3072,3584,0.028071112102932397
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,3072,5120,0.09954933325449626
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,3072,51200,1.0235261917114258
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,3072,3072,0.02641955514748891
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,3072,4096,0.08195822106467353
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,3072,2560,0.020571556356218126
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,3072,3584,0.07298044363657634
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,3072,2048,0.017542221479945712
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,3072,65536,1.3012746175130208
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,3072,1536,0.01475288967291514
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,3072,1024,0.010486221975750394
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,3072,3072,0.06322489182154338
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,3072,2560,0.054309331708484225
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,3072,768,0.008974221845467886
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,3072,2048,0.0443102220694224
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,3072,512,0.007263999846246507
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,3072,256,0.005909333212508096
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,3072,1536,0.036785778072145246
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,3072,1024,0.027471999327341717
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,3072,128,0.005271111097600725
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,3072,768,0.02439555525779724
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,3072,64,0.004924444274769889
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,3072,512,0.019878221882714164
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,3072,32,0.005222222043408289
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,3072,256,0.01717333330048455
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,3072,128,0.016533333394262526
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,3072,64,0.016336888074874878
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,3072,32,0.01610666679011451
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,2560,16384,0.0967715581258138
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,3072,5120,0.03783644570244683
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,2560,65536,0.3764595455593533
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,2560,12288,0.0729279981719123
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,3072,6144,0.11677600277794732
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,2560,10240,0.06253421968883939
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,2560,16384,0.30296622382269967
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,2560,8192,0.04966400067011515
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,2560,12288,0.2516106764475505
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,2560,7168,0.045689778195487134
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,2560,6144,0.036751998795403376
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,2560,10240,0.1884444422192044
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,2560,8192,0.147088885307312
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,2560,5120,0.03138844503296746
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,2560,4096,0.026535999443795946
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,2560,7168,0.13095822599199083
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,2560,51200,0.952522701687283
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,2560,3584,0.024189333120981853
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,2560,6144,0.11036711268954807
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,2560,3072,0.02199466692076789
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,2560,5120,0.09330044190088908
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,2560,2560,0.018909333480728995
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,2560,4096,0.0766471094555325
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,2560,2048,0.016193777322769165
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,2560,1536,0.013183111117945777
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,2560,3072,0.05954933166503906
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,2560,1024,0.01018044435315662
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,2560,2560,0.049935112396876015
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,2560,2048,0.04151733385192023
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,2560,768,0.00868800034125646
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,2560,1536,0.0347324444188012
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,2560,1024,0.02679377794265747
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,2560,51200,0.30213867293463814
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,2560,768,0.023023999399609033
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,2560,128,0.005032000028424793
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,2560,512,0.018920888503392536
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,2560,64,0.004870222260554631
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,2560,32,0.004842666702138053
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,2560,256,0.016569778323173523
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,2560,128,0.015838222371207345
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,2560,64,0.015800888339678448
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,2560,32,0.01552088889810774
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,2048,51200,0.2316968970828586
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,2048,65536,0.31240712271796334
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,2048,16384,0.08184266752666898
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,2048,12288,0.05827022261089749
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,2560,65536,1.2137253019544814
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,2560,3584,0.0679911110136244
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,2048,16384,0.2997182210286458
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,2048,10240,0.05160177747408549
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,2048,8192,0.03820533222622342
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,2048,12288,0.2288151052263048
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,2048,7168,0.03791822327507867
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,2560,512,0.007368000017272101
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,2048,6144,0.029197331931855943
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,2048,10240,0.17949067221747506
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,2560,256,0.005922666854328579
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,2048,51200,0.8988089031643338
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,2048,4096,0.020301333732075162
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,2048,7168,0.1238880025015937
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,2048,6144,0.10417599810494317
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,2048,3584,0.01830933325820499
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,2048,65536,1.1523617638481987
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,2048,5120,0.08848177724414402
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,2048,2560,0.01459377838505639
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,2048,2048,0.012697777814335294
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,2048,4096,0.07311999797821045
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,2048,3072,0.05743733379575941
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,2048,1536,0.01038577738735411
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,2048,1024,0.00833333366447025
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,2048,2560,0.04744889007674324
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,2048,2048,0.03963466816478305
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,2048,768,0.007149332927332983
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,2048,1536,0.03262933426433139
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,2048,512,0.006155555446942647
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,2048,768,0.022319111559126113
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,2048,256,0.004899555610285865
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,2048,512,0.018205333087179396
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,2048,128,0.004555555681387584
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,2048,256,0.015810666812790763
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,2048,64,0.003909333298603694
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,2048,128,0.015132443772421943
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,2048,32,0.0042071110672420925
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,2048,64,0.01481599940194024
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,2048,5120,0.02528000043498145
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,2048,8192,0.14057600498199463
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,2048,32,0.014920888675583733
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,2048,3072,0.01651822196112739
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,1536,51200,0.19621333811018202
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,1536,65536,0.24242488543192545
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,1536,16384,0.05944355328877767
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,2048,3584,0.06568888823191325
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,1536,12288,0.050741334756215416
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,1536,10240,0.03864622116088867
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,1536,8192,0.033089776833852134
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,1536,12288,0.20262132750617134
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,1536,16384,0.2691280047098796
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,2048,1024,0.024987555212444727
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,1536,10240,0.167066666815016
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,1536,7168,0.02715377840730879
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,1536,6144,0.023074666659037273
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,1536,5120,0.020222221811612446
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,1536,8192,0.13084622224171957
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,1536,4096,0.017820444371965196
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,1536,3584,0.015836444165971544
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,1536,7168,0.11690666940477158
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,1536,6144,0.10708266496658325
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,1536,5120,0.08229600058661567
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,1536,3072,0.015004444453451367
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,1536,2560,0.012314666476514606
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,1536,4096,0.06698044141133626
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,1536,2048,0.010685332947307162
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,1536,3584,0.05965244770050049
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,1536,1536,0.008645333349704742
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,1536,65536,1.0428667068481445
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,1536,1024,0.007260444263617198
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,1536,3072,0.05244444476233589
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,1536,768,0.0064080001579390625
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,1536,2048,0.03654311100641886
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,1536,1536,0.02993511160214742
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,1536,1024,0.023031999667485554
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,1536,768,0.020966221888860066
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,1536,128,0.0041848888827694785
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,1536,256,0.015077332655588785
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,1536,64,0.003913777983850903
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,1536,128,0.014501333236694336
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,1536,32,0.004184000194072723
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,1536,64,0.014093332820468478
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,1536,32,0.014137778017255994
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,1024,65536,0.20361688401963976
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,1536,51200,0.8180658022562662
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,1024,51200,0.15457155969407824
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,1024,16384,0.05532177620463901
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,1536,2560,0.04392888810899523
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,1536,512,0.005616888817813661
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,1024,12288,0.03869955407248603
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,1024,10240,0.03221599923239814
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,1536,256,0.004577777865860197
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,1536,512,0.01718844473361969
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,1024,8192,0.026559111144807603
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,1024,16384,0.2736835479736328
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,1024,7168,0.02368800010946062
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,1024,12288,0.19259999858008492
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,1024,6144,0.02107644412252638
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,1024,10240,0.1591377788119846
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,1024,5120,0.018564444449212816
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,1024,4096,0.015633778439627755
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,1024,8192,0.1241404480404324
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,1024,7168,0.1092568900850084
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,1024,3584,0.013768889009952545
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,1024,6144,0.09228177865346272
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,1024,51200,0.7744142214457194
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,1024,5120,0.07715644439061482
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,1024,2560,0.010752889017264048
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,1024,2048,0.009647111097971598
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,1024,4096,0.06298666530185275
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,1024,1536,0.00793511089351442
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,1024,3584,0.05555644300248888
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,1024,1024,0.006573333508438534
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,1024,3072,0.04772355490260654
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,1024,768,0.0058986664646201665
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,1024,2560,0.04105066590838962
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,1024,512,0.0052133335007561584
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,1024,2048,0.03458133339881897
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,1024,1536,0.0287715560860104
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,1024,128,0.004187555362780889
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,1024,1024,0.022302221920755174
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,1024,768,0.01958577831586202
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,1024,512,0.01660355594423082
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,1024,256,0.014118222726715935
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,1024,32,0.003866666720973121
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,1024,128,0.013591999808947245
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,1024,64,0.013439999686347114
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,1024,32,0.01311911145846049
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,768,65536,0.1378648943371243
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,768,51200,0.11382844712999131
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,768,16384,0.04000000158945719
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,1024,65536,0.9885128868950738
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,768,16384,0.2457804414961073
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,1024,3072,0.01277511070171992
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,768,12288,0.027753776974148218
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,768,10240,0.023419555690553453
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,768,8192,0.01943199998802609
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,768,51200,0.7431377834743924
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,1024,256,0.0042239998777707415
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,768,12288,0.1859039995405409
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,768,65536,0.94723023308648
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,768,7168,0.01778044468826718
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,768,10240,0.15285689300960964
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,768,5120,0.01386577801571952
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,768,8192,0.11941688590579563
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,1024,64,0.0035706667436493766
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,768,4096,0.01183199965291553
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,768,3584,0.010677333507272931
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,768,3072,0.009646221995353699
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,768,7168,0.10202755530675252
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,768,6144,0.08808355861239964
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,768,5120,0.07419466972351074
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,768,2560,0.008623999853928884
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,768,4096,0.060439997249179415
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,768,3584,0.05321422219276428
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,768,2048,0.007477333148320516
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,768,1536,0.0069217777086628815
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,768,1024,0.005202666752868229
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,768,3072,0.045758220884535045
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,768,768,0.004543111142185
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,768,2560,0.03891822364595201
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,768,512,0.004263999975389904
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,768,2048,0.0329111119111379
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,768,256,0.0038942222793896994
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,768,1536,0.027445332871543035
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,768,1024,0.021516443954573736
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,768,128,0.0034942221310403612
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,768,64,0.0035742223262786865
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,768,512,0.01585244470172458
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,768,32,0.003516444315512975
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,768,256,0.013795555465751223
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,768,128,0.01314133322901196
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,768,64,0.013075555364290873
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,512,65536,0.11049599779976739
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,768,32,0.012512889173295764
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,512,51200,0.08693333466847737
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,512,16384,0.03441155619091458
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,512,12288,0.027097778187857732
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,512,10240,0.023575110567940608
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,512,16384,0.23586400349934897
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,512,12288,0.17807911501990425
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,512,8192,0.019663110375404358
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,768,6144,0.0158942225906584
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,512,7168,0.017845332622528076
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,512,6144,0.016525333126386006
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,512,8192,0.11450578106774224
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,512,51200,0.7102177937825521
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,512,5120,0.013582222163677216
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,512,4096,0.011337777806652917
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,512,6144,0.08434222141901652
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,512,65536,0.907573382059733
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,512,3584,0.010701333483060202
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,512,3072,0.009640889035330879
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,512,5120,0.07136178016662598
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,512,4096,0.05715733104281955
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,512,2560,0.008346666892369589
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,768,768,0.018887110882335238
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,512,3584,0.050236443678538
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,512,2048,0.007284444239404466
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,512,3072,0.042504890097512134
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,512,1536,0.006276444428496891
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,512,1024,0.005534222142563925
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,512,2560,0.037018666664759316
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,512,768,0.004870222260554631
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,512,512,0.004510222209824456
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,512,1536,0.026612444056404963
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,512,1024,0.020948444803555805
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,512,256,0.0038382220599386427
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,512,128,0.003510222252872255
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,512,768,0.0188044442070855
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,512,512,0.015463999576038785
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,512,64,0.003516444315512975
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,512,32,0.0035173334181308746
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,512,128,0.012784889174832238
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,512,64,0.012438221938080259
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,512,32,0.012297777665985955
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,512,10240,0.14660355779859754
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,256,51200,0.054141332705815635
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,256,16384,0.01920355525281694
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,512,7168,0.09876888990402222
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,256,12288,0.016711110870043438
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,256,10240,0.01835555500454373
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,256,16384,0.2248915566338433
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,256,8192,0.013288000391589271
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,256,12288,0.16971288786994088
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,256,10240,0.13989688290490046
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,256,51200,0.6762684186299642
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,256,7168,0.012440889245933957
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,256,6144,0.010888888604111142
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,512,2048,0.03151377704408433
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,256,65536,0.8623421986897787
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,256,5120,0.00942755573325687
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,256,4096,0.008280889027648503
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,256,7168,0.09352533022562663
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,256,6144,0.08006399869918823
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,512,256,0.013456888496875763
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,256,5120,0.06733422146903144
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,256,3072,0.00720888872941335
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,256,4096,0.05437689026196798
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,256,2560,0.006567111031876669
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,256,2048,0.005558222118351195
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,256,65536,0.06577510966195001
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,256,3584,0.047488000657823354
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,256,3072,0.04073422153790792
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,256,1536,0.00508711114525795
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,256,2560,0.0354968872335222
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,256,2048,0.03086400032043457
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,256,768,0.0038542221817705366
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,256,512,0.003549333247873518
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,256,1536,0.02552622225549486
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,256,1024,0.01994755533006456
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,256,256,0.0034924443397257063
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,256,128,0.0028808888875775864
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,256,768,0.01789777808719211
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,256,512,0.01496444476975335
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,256,256,0.012950222525331708
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,256,32,0.0028231110837724474
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,256,128,0.012101333174440594
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,256,64,0.012044444680213928
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,128,65536,0.048039999273088246
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,256,32,0.012059555285506778
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,128,51200,0.039080000585979886
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,128,16384,0.016891555653678048
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,256,3584,0.007595555649863348
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,128,12288,0.01387111097574234
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,128,16384,0.22471732563442656
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,128,10240,0.011709333293967776
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,256,1024,0.004543999830881755
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,128,12288,0.16933688852522108
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,128,51200,0.6758142047458224
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,128,8192,0.01000711073478063
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,128,10240,0.13958933618333605
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,128,7168,0.010382222632567087
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,128,65536,0.8613653182983398
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,128,6144,0.009685333404276106
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,128,5120,0.00902133352226681
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,256,64,0.0028195555011431375
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,128,8192,0.10794222354888916
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,128,7168,0.09332178036371867
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,128,6144,0.07928178045484754
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,128,3584,0.007313778003056844
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,128,5120,0.06692533360587226
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,128,3072,0.006568888823191325
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,128,2560,0.0059004442559348206
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,128,4096,0.053605334626303784
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,128,2048,0.005535999933878581
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,128,3584,0.04715555575158861
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,128,1536,0.004857777721352047
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,128,3072,0.04136000076929728
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,128,1024,0.004176889028814104
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,128,768,0.003867555409669876
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,128,2560,0.03478577733039856
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,256,8192,0.10885244607925415
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,128,512,0.0034959999223550162
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,128,2048,0.030512889226277668
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,128,1536,0.025403555896547105
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,128,1024,0.019899555378490023
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,128,128,0.002954666606254048
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,128,64,0.0028604444944196274
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,128,768,0.017851556340853374
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,128,32,0.0028088889602157804
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,128,256,0.012771555946932899
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,64,65536,0.04495999879307217
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,128,128,0.012423111332787408
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,128,64,0.011758222348160215
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,64,51200,0.035058667262395225
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,128,32,0.011730666789743634
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,64,16384,0.013122667041089801
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,64,12288,0.16964533593919542
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,64,10240,0.010672888822025724
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,128,4096,0.0079297779334916
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,64,8192,0.010013333625263637
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,64,51200,0.6754239930046929
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,64,10240,0.13973511589898005
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,64,7168,0.00980000032318963
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,64,65536,0.8624186515808105
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,64,6144,0.00902133352226681
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,64,8192,0.10804444551467896
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,64,5120,0.008991111483838823
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,64,4096,0.007630222373538547
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,64,7168,0.09212088584899902
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,128,256,0.003198222153716617
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,64,3584,0.006955555743641323
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,64,6144,0.07936533292134602
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,64,3072,0.006567111031876669
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,64,5120,0.06726577546861437
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,128,512,0.014855111638704935
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,64,2560,0.005894222193294101
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,64,4096,0.05375022358364529
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,64,3584,0.04692000150680542
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,64,2048,0.0053431110249625305
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,64,1536,0.004528000122971005
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,64,2560,0.034576889541414045
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,64,1024,0.004193777839342753
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,64,768,0.003671110918124517
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,64,2048,0.030193779203626845
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,64,1536,0.02512888941499922
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,64,512,0.003567111161020067
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,64,256,0.0032231110251612137
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,64,1024,0.019893333315849304
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,64,768,0.017648888958825003
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,64,128,0.0028284444577164124
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,64,512,0.014478221535682678
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,64,64,0.0028284444577164124
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,64,32,0.002867555452717675
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,64,256,0.012771555946932899
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,64,128,0.012040889097584618
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,32,65536,0.041301333241992526
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,64,64,0.011696889168686338
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,64,32,0.011706666813956367
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,32,51200,0.03356533249219259
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,32,16384,0.010378667049937779
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,32,12288,0.00920800036854214
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,32,16384,0.22451644473605684
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,32,12288,0.16934933927324083
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,32,10240,0.008558221989207799
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,32,8192,0.007711999946170383
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,32,10240,0.1398906707763672
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,32,51200,0.6756533516777886
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,32,8192,0.10797155565685695
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,32,7168,0.007330666813585494
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,32,6144,0.010421333213647207
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,32,65536,0.8626080089145236
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,32,5120,0.01036000003417333
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,32,4096,0.009295110901196798
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,32,7168,0.09220977624257405
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,32,6144,0.07926488584942289
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,32,3584,0.008401778009202745
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,64,16384,0.2245075437757704
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,32,3072,0.007609777980380588
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,32,5120,0.06694933440950182
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,32,2560,0.006707555717892117
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,32,4096,0.053567998939090304
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,32,2048,0.006236444330877728
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,32,3584,0.04691733254326714
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,32,1536,0.004536889079544279
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,32,3072,0.04038222299681769
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,32,2560,0.0346666673819224
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,32,2048,0.029934220843844946
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,32,768,0.003583999971548716
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,32,1536,0.025368889172871906
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,32,1024,0.01994311147265964
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,32,256,0.003148444410827425
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,32,512,0.014840000205569796
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,32,128,0.0028124445428450904
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,32,256,0.01239733315176434
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,32,64,0.0028159999185138275
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,32,128,0.012103111379676394
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,32,32,0.0028124445428450904
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,32,64,0.011723555624485016
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,64,3072,0.04038844505945841
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,64,12288,0.011755555868148804
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,32,32,0.011763555308183035
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,32,1024,0.0038373333712418876
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1793,32,512,0.003175111073586676
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1793,32,768,0.01776000029510922
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,65536,16384,2.22017945183648
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,65536,12288,1.7133910920884874
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,65536,12288,1.9255385928683812
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,65536,16384,2.709742228190104
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,65536,10240,1.364201757642958
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,65536,16384,2.412445280287001
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,65536,10240,1.5794995625813801
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,65536,8192,1.1008275349934895
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,65536,12288,1.822231928507487
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,65536,10240,1.4526604546440973
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,65536,7168,0.8832444614834256
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,65536,8192,1.2640053431193035
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,65536,7168,1.0724702411227756
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,65536,51200,7.087915632459853
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,65536,8192,1.1470186445448134
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,65536,6144,0.894004397922092
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,65536,6144,0.9186275270250109
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,65536,5120,0.7128533257378472
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,65536,7168,0.9934132893880209
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,65536,4096,0.551470226711697
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,65536,5120,0.7808417744106717
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,65536,6144,0.8258222473992242
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,65536,3584,0.533880869547526
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,65536,3584,0.524819533030192
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,65536,5120,0.7045920160081652
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,65536,4096,0.6457680066426595
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,65536,3072,0.45252535078260636
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,65536,4096,0.5699191093444824
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,65536,2560,0.3295182122124566
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,65536,3072,0.4533608754475911
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,65536,3584,0.5016942024230957
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,65536,2560,0.506390200720893
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,65536,3072,0.4417777856190999
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,65536,2048,0.28043466144137913
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,65536,2560,0.37488889694213867
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,65536,2048,0.3284408781263563
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,65536,1536,0.21093066533406576
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,65536,1024,0.14744888411627874
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,65536,1536,0.2667982313368055
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,65536,51200,10.333693610297308
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,65536,768,0.11153244972229004
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,65536,2048,0.3138391176859538
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,65536,1536,0.24938578075832793
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,65536,1024,0.23025332556830513
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,65536,512,0.08186133040322198
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,65536,768,0.1685333384407891
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,65536,256,0.05957066350513034
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,65536,768,0.16075111760033503
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,65536,512,0.1311804453531901
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,65536,512,0.13549066914452448
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,65536,128,0.05542666713396708
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,65536,256,0.11865599950154622
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,65536,64,0.047930667797724404
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,65536,128,0.0862542192141215
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,65536,32,0.04916888806555006
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,65536,128,0.11030489206314087
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,65536,64,0.11140888267093235
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,65536,32,0.1117111047108968
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,65536,1024,0.19231200218200684
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,65536,256,0.1089937753147549
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,65536,51200,7.769929673936631
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,51200,16384,1.7755520078870985
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,51200,16384,2.1826843685574002
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,51200,51200,5.380171457926433
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,51200,12288,1.3076978259616427
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,51200,65536,7.008599175347222
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,51200,16384,1.9480018615722656
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,51200,12288,1.5045057932535808
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,51200,10240,1.1684391233656142
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,51200,51200,8.003690083821615
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,51200,10240,1.286277347140842
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,51200,12288,1.3955769009060328
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,51200,8192,0.8886515299479166
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,51200,10240,1.1661323971218533
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,51200,7168,0.7643484539455838
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,51200,8192,0.9837769402398003
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,51200,6144,0.6609937879774306
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,51200,7168,0.8641377554999458
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,51200,8192,0.9294409222073026
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,51200,65536,10.740264044867622
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,51200,6144,0.7143999735514323
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,51200,7168,0.8330257733662924
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,51200,5120,0.5465395715501573
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,51200,4096,0.37533066007826066
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,51200,5120,0.6702542304992676
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,51200,3584,0.34224266476101345
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,51200,51200,6.242205301920573
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,51200,4096,0.48951111899481875
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,51200,3584,0.43054845598008895
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,51200,5120,0.566971566942003
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,51200,6144,0.6764782269795736
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,51200,4096,0.47501065995958114
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,51200,3072,0.33692532115512425
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,51200,2560,0.26355287763807506
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,51200,3072,0.3646879990895589
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,51200,2048,0.22400267918904623
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,51200,2560,0.3258391221364339
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,51200,3072,0.3574853208329942
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,51200,1536,0.17945599555969238
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,51200,2048,0.2862328953213162
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,51200,2560,0.3093786769443088
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,51200,2048,0.2554871241251628
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,51200,1024,0.12604355812072754
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,51200,1536,0.2064159976111518
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,51200,768,0.09168889125188191
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,51200,1024,0.1606986655129327
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,51200,1536,0.20571288797590467
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,51200,1024,0.16089067194196913
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,51200,512,0.0653688907623291
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,51200,256,0.048306667142444186
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,51200,768,0.13340266545613608
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,51200,768,0.14599733882480198
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,51200,128,0.03934577769703335
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,51200,512,0.10962400171491836
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,51200,512,0.10828710926903619
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,51200,256,0.09455644422107273
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,51200,256,0.0877315534485711
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,51200,32,0.037238223685158625
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,51200,64,0.03563377923435635
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,51200,128,0.09418844514422947
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,51200,128,0.07007200188106961
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,51200,64,0.08967022101084392
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,51200,32,0.08978933095932007
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,51200,65536,8.094974093967014
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,51200,3584,0.41409866015116376
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,16384,16384,0.6790062056647407
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,16384,16384,0.7806497679816352
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,16384,12288,0.4187146557701959
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,16384,51200,1.9898541768391926
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,16384,65536,2.553661346435547
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,16384,12288,0.5847173266940647
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,16384,16384,0.7986817889743381
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,16384,10240,0.28743643230862087
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,16384,51200,2.744783189561632
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,16384,8192,0.26080356703864205
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,16384,10240,0.4751288625929091
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,16384,12288,0.6092906528049046
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,16384,65536,3.724596235487196
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,16384,10240,0.5063609017266167
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,16384,8192,0.3890684445699056
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,16384,7168,0.25753598743014866
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,16384,6144,0.17353599601321748
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,16384,8192,0.40060443348354763
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,16384,7168,0.3451271057128906
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,16384,51200,2.563494152492947
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,16384,6144,0.2944524553087023
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,16384,5120,0.1956942213906182
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,16384,7168,0.3505360020531549
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,16384,4096,0.14949956205156115
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,16384,6144,0.3036328951517741
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,16384,5120,0.23783556620279947
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,16384,4096,0.21015911632113984
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,16384,3584,0.1329475508795844
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,16384,5120,0.2718737655215793
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,16384,3072,0.1202933390935262
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,16384,4096,0.21277333630455864
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,16384,3584,0.1685484382841322
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,16384,3584,0.19189955128563774
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,16384,2560,0.10167022546132405
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,16384,3072,0.1706062157948812
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,16384,2048,0.0616497794787089
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,16384,65536,3.3093831804063587
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,16384,2560,0.12713778018951416
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,16384,1536,0.04787466592258877
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,16384,2560,0.14543822076585558
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,16384,2048,0.10862666368484497
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,16384,1024,0.034713778230879046
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,16384,2048,0.12485688262515598
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,16384,1536,0.1017448902130127
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,16384,768,0.03049422303835551
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,16384,1024,0.06504178047180176
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,16384,1024,0.08192355765236749
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,16384,512,0.02906044324239095
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,16384,768,0.06875199741787381
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,16384,1536,0.0882871084743076
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,16384,768,0.053448001543680825
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,16384,128,0.016671111186345417
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,16384,512,0.059531556235419385
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,16384,512,0.043453332450654775
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,16384,256,0.04823644293679131
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,16384,256,0.03809244434038798
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,16384,32,0.014766222900814481
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,16384,128,0.03527733352449205
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,16384,128,0.03892711136076186
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,16384,64,0.03568799959288703
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,16384,32,0.03458311160405477
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,16384,3072,0.15309245056576198
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,16384,256,0.021344888541433547
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,16384,64,0.014099554883109199
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,12288,16384,0.43144623438517254
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,12288,51200,1.4468729231092665
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,12288,16384,0.638705783420139
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,12288,65536,1.9354799058702257
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,12288,12288,0.37104090054829914
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,12288,10240,0.28998133871290416
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,12288,12288,0.47013245688544375
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,12288,51200,2.2646257612440324
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,12288,16384,0.6826817724439832
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,12288,8192,0.21283288796742758
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,12288,12288,0.5342115296257867
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,12288,65536,2.946024788750542
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,12288,10240,0.41997867160373265
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,12288,8192,0.30658043755425346
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,12288,7168,0.2007662190331353
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,12288,10240,0.4312124517228868
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,12288,6144,0.157679107454088
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,12288,7168,0.2750479910108778
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,12288,8192,0.35947733455234104
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,12288,5120,0.13285956117841932
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,12288,7168,0.3084533214569092
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,12288,4096,0.10668622122870551
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,12288,51200,2.148411644829644
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,12288,6144,0.26231198840671116
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,12288,5120,0.1942408879597982
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,12288,3584,0.10098310973909165
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,12288,4096,0.1561653349134657
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,12288,5120,0.22769334581163195
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,12288,3072,0.08436889118618435
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,12288,4096,0.20690755049387613
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,12288,3584,0.13908799489339194
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,12288,3584,0.16591555542416042
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,12288,2560,0.07304088936911689
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,12288,3072,0.12230311499701606
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,12288,3072,0.14748444822099474
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,12288,2048,0.05972799989912245
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,12288,1536,0.04319644305441114
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,12288,2560,0.12740888860490587
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,12288,2560,0.11143022113376194
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,12288,2048,0.0914177762137519
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,12288,1024,0.03157866663402981
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,12288,2048,0.10862044493357341
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,12288,1536,0.07095555464426677
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,12288,768,0.023131555981106226
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,12288,1536,0.08949955304463704
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,12288,1024,0.05617955658170912
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,12288,1024,0.07004888852437337
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,12288,768,0.04435999857054817
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,12288,768,0.06076622009277344
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,12288,256,0.01834755473666721
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,12288,512,0.035635554128222995
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,12288,512,0.051015112135145396
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,12288,128,0.016421332955360413
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,12288,6144,0.22932622167799208
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,12288,256,0.03104355600145128
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,12288,256,0.0421706669860416
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,12288,64,0.015227556228637695
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,12288,32,0.015840000576443143
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,12288,128,0.03361777795685662
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,12288,128,0.029232889413833618
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,12288,64,0.029178665743933782
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,12288,32,0.028785778416527644
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,12288,65536,2.7614996168348522
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,12288,512,0.01864177816443973
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,10240,51200,0.9414968490600586
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,10240,16384,0.3405591117011176
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,10240,65536,1.2808222240871854
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,10240,12288,0.27461332745022243
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,10240,16384,0.6225831243726943
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,10240,12288,0.44704177644517684
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,10240,51200,1.9667474958631728
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,10240,16384,0.6244639820522732
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,10240,10240,0.22369244363572863
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,10240,12288,0.46818309360080296
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,10240,8192,0.18075733714633516
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,10240,10240,0.3541404406229655
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,10240,7168,0.1529973347981771
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,10240,10240,0.38952088356018066
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,10240,8192,0.27101066377427846
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,10240,6144,0.1288506719801161
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,10240,8192,0.33149955007765025
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,10240,7168,0.23733245001898873
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,10240,5120,0.11397511429256862
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,10240,7168,0.2729004489050971
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,10240,51200,1.9090834723578558
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,10240,4096,0.09588177998860677
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,10240,6144,0.20227289199829102
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,10240,6144,0.23966312408447266
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,10240,3584,0.06891200277540419
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,10240,65536,2.4793805016411676
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,10240,4096,0.14323466353946263
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,10240,4096,0.16758844587537977
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,10240,3072,0.06947377655241224
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,10240,3584,0.12496977382236057
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,10240,65536,2.5672969818115234
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,10240,2560,0.06422399812274508
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,10240,2048,0.04738577869203356
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,10240,3072,0.11098044448428684
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,10240,3072,0.13293422593010798
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,10240,1536,0.0365626679526435
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,10240,2560,0.11561777856614854
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,10240,2048,0.08163644207848443
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,10240,2048,0.09954577684402466
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,10240,1024,0.02511377798186408
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,10240,1536,0.08196622133255005
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,10240,1536,0.06282933553059895
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,10240,768,0.019948444432682462
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,10240,1024,0.04760711060629951
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,10240,1024,0.06553066439098783
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,10240,512,0.015524443652894763
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,10240,768,0.039460443788104586
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,10240,768,0.05657244390911526
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,10240,256,0.012076444096035428
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,10240,512,0.03155288762516446
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,10240,512,0.04745599958631727
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,10240,5120,0.17082577281528047
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,10240,128,0.010955555571450127
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,10240,256,0.03811288873354594
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,10240,256,0.027582221561008032
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,10240,64,0.009703111317422655
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,10240,32,0.009663999908500248
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,10240,128,0.026864889595243666
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,10240,5120,0.20049333572387695
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,10240,64,0.02609599961174859
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,10240,32,0.02610133257177141
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,10240,3584,0.1496560043758816
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,10240,2560,0.09486311011844212
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,8192,16384,0.29237866401672363
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,8192,51200,1.021267573038737
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,8192,65536,1.2010133531358507
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,10240,128,0.031201776531007554
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,8192,12288,0.23792711893717447
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,8192,16384,0.4882826805114746
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,8192,10240,0.20060177644093832
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,8192,12288,0.36238667700025773
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,8192,51200,1.6676941977606878
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,8192,8192,0.16750310526953804
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,8192,16384,0.6111911137898763
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,8192,10240,0.3084542221493191
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,8192,12288,0.44298932287428117
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,8192,65536,2.1276062859429254
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,8192,7168,0.14162400033738878
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,8192,10240,0.36237867673238117
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,8192,8192,0.2566044330596924
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,8192,6144,0.1229226721657647
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,8192,7168,0.21180533038245308
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,8192,8192,0.293175114525689
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,8192,5120,0.1001395583152771
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,8192,6144,0.18230311075846353
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,8192,7168,0.25572265519036186
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,8192,51200,1.7547964519924586
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,8192,4096,0.08668888939751519
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,8192,6144,0.2210986614227295
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,8192,3584,0.06896533568700154
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,8192,5120,0.19085778130425346
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,8192,4096,0.12159555488162571
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,8192,4096,0.15546666251288518
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,8192,3072,0.06384711133109199
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,8192,3584,0.1101564433839586
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,8192,2560,0.05497511227925619
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,8192,3584,0.141865783267551
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,8192,3072,0.09708178043365479
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,8192,3072,0.12428177727593316
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,8192,2048,0.04486933350563049
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,8192,1536,0.03252799974547492
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,8192,2560,0.08382133642832439
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,8192,2560,0.10843644539515178
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,8192,1024,0.023570666710535686
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,8192,2048,0.06902844376034208
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,8192,2048,0.09223466449313694
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,8192,1536,0.05529333485497368
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,8192,768,0.02060622142420875
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,8192,1024,0.060255997710757785
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,8192,1024,0.04211466511090597
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,8192,512,0.018017777138286166
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,8192,768,0.05299911234113905
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,8192,768,0.03548355566130744
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,8192,256,0.013449778159459433
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,8192,512,0.028282665544086035
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,8192,512,0.04360533422893948
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,8192,128,0.011712888876597086
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,8192,256,0.03563111027081808
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,8192,256,0.02421244482199351
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,8192,64,0.010679110884666443
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,8192,128,0.02345866627163357
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,8192,32,0.011258666714032492
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,8192,128,0.03086755673090617
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,8192,64,0.02332177758216858
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,8192,32,0.023224888576401606
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,8192,65536,2.241323471069336
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,8192,1536,0.07687199778027005
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,7168,65536,0.9173919889662
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,7168,51200,0.7664808697170682
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,7168,16384,0.25807287957933217
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,7168,12288,0.1967866685655382
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,8192,5120,0.14962311585744223
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,7168,16384,0.478074656592475
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,7168,12288,0.360318210389879
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,7168,10240,0.17428799470265707
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,7168,12288,0.4110115634070502
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,7168,16384,0.5651715596516927
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,7168,51200,1.5308151245117188
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,7168,65536,1.9410603841145833
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,7168,8192,0.14406843980153403
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,7168,10240,0.2858640087975396
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,7168,7168,0.1228968832227919
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,7168,8192,0.22016621960533989
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,7168,10240,0.3464799986945258
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,7168,6144,0.11096000009112889
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,7168,8192,0.2744684484269884
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,7168,7168,0.19237155384487578
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,7168,5120,0.08548355764812893
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,7168,7168,0.24086311128404406
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,7168,4096,0.07032533486684163
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,7168,6144,0.16420888900756836
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,7168,6144,0.20782577991485596
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,7168,5120,0.13976621627807617
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,7168,3584,0.06068355507320828
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,7168,5120,0.17699289321899414
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,7168,3072,0.055252446068657764
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,7168,4096,0.15435289012061224
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,7168,51200,1.644765324062771
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,7168,2560,0.0440977778699663
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,7168,3584,0.10171288914150661
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,7168,3072,0.09028000301784939
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,7168,3072,0.11747288703918457
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,7168,65536,2.093478308783637
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,7168,2560,0.07807822359932794
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,7168,2560,0.10458044211069743
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,7168,2048,0.0643120010693868
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,7168,1024,0.021182222498787776
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,7168,1536,0.07414488659964667
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,7168,1024,0.03895111216439141
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,7168,1024,0.05740977658165825
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,7168,768,0.0173653331067827
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,7168,768,0.05073066552480062
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,7168,768,0.03354133168856303
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,7168,512,0.013457777599493662
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,7168,512,0.04163555635346307
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,7168,512,0.02696888811058468
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,7168,256,0.010382222632567087
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,7168,4096,0.11457867092556423
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,7168,3584,0.13189778063032362
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,7168,256,0.02313511073589325
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,7168,128,0.009347555538018545
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,7168,256,0.03427822060055203
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,7168,2048,0.0355368885729048
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,7168,64,0.008671110702885522
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,7168,32,0.008972444468074376
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,7168,1536,0.027685332629415724
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,7168,128,0.029816001653671265
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,7168,128,0.021985777550273474
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,7168,64,0.02199466692076789
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,7168,2048,0.08700533045662774
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,7168,32,0.02165866725974613
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,7168,1536,0.05193600058555603
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,6144,16384,0.252895991007487
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,6144,51200,0.7324293454488119
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,6144,65536,0.897758271959093
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,6144,16384,0.4228382110595703
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,6144,12288,0.18864533636305067
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,6144,12288,0.3158080048031277
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,6144,51200,1.3877911037868922
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,6144,16384,0.5225813123914931
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,6144,10240,0.15920889377593994
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,6144,12288,0.3957422309451633
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,6144,8192,0.12940443886650935
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,6144,65536,1.7797421349419489
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,6144,10240,0.2628542317284478
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,6144,7168,0.11031644211875068
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,6144,8192,0.20786578125423857
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,6144,7168,0.17763022581736246
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,6144,6144,0.1015697783894009
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,6144,51200,1.5341173807779949
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,6144,7168,0.22478577825758192
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,6144,5120,0.08322666751013862
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,6144,6144,0.15219822194841173
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,6144,6144,0.19289067056443956
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,6144,5120,0.1287226676940918
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,6144,4096,0.0631928907500373
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,6144,65536,1.9575102064344618
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,6144,5120,0.16640533341301814
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,6144,3584,0.05565155877007378
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,6144,3072,0.0514977773030599
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,6144,4096,0.10533599721060859
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,6144,4096,0.13760888576507568
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,6144,3584,0.09411822424994574
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,6144,3584,0.12410222159491645
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,6144,2560,0.04158044523662991
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,6144,2048,0.029913776450686987
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,6144,3072,0.08239733510547213
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,6144,3072,0.1096000009112888
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,6144,2560,0.0963297751214769
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,6144,1536,0.024217777782016333
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,6144,2048,0.058824002742767334
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,6144,2048,0.08163377973768446
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,6144,1024,0.017647110753589206
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,6144,1536,0.06875110997094049
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,6144,10240,0.32211732864379883
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,6144,768,0.01483022173245748
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,6144,8192,0.2739146550496419
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,6144,1536,0.04778844449255201
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,6144,1024,0.036349332994884916
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,6144,1024,0.05455733338991801
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,6144,512,0.011740444435013665
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,6144,256,0.009091555244392818
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,6144,768,0.031151112582948472
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,6144,128,0.00793688909875022
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,6144,512,0.024756444825066462
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,6144,512,0.039800001515282526
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,6144,256,0.021543999512990315
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,6144,256,0.03325422273741828
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,6144,64,0.007069333559936947
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,6144,32,0.0069751110341813825
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,6144,128,0.02864711152182685
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,6144,64,0.02057422200838725
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,6144,32,0.020283554991086323
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,6144,2560,0.07189866569307116
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,5120,51200,0.48070844014485675
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,5120,65536,0.6752435366312662
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,5120,16384,0.17903110716078016
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,6144,768,0.04669688807593452
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,5120,16384,0.4331582122378879
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,5120,12288,0.1281368864907159
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,6144,128,0.02093155516518487
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,5120,51200,1.2542568842569988
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,5120,10240,0.11910488870408799
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,5120,12288,0.29626666174994576
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,5120,16384,0.4883777830335829
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,5120,65536,1.6328372955322266
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,5120,8192,0.08949777815077041
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,5120,12288,0.35630043347676593
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,5120,10240,0.2387155426873101
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,5120,7168,0.07773955663045247
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,5120,10240,0.2966853247748481
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,5120,8192,0.1897439956665039
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,5120,6144,0.06631111436420016
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,5120,5120,0.05513866742451986
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,5120,8192,0.23705156644185385
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,5120,7168,0.1625279982884725
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,5120,7168,0.20699466599358451
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,5120,6144,0.14018666744232178
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,5120,6144,0.18115733729468453
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,5120,4096,0.048736890157063804
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,5120,5120,0.12147911389668782
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,5120,3584,0.04292444388071696
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,5120,4096,0.09734577602810329
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,5120,4096,0.12872178024715847
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,5120,65536,1.8076754675971136
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,5120,51200,1.4204764895968969
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,5120,3072,0.03528799944453769
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,5120,3584,0.11521422863006592
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,5120,3584,0.08736977974573772
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,5120,2048,0.02520711057715946
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,5120,3072,0.10218844148847793
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,5120,2560,0.0639680027961731
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,5120,1536,0.01960444450378418
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,5120,2048,0.054104000329971313
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,5120,2048,0.07710133658515082
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,5120,1024,0.014639111028777229
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,5120,1536,0.04422488808631897
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,5120,1536,0.06462755468156603
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,5120,768,0.012420444852775998
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,5120,1024,0.033815999825795494
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,5120,1024,0.051065779394573636
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,5120,512,0.009418666362762451
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,5120,768,0.028331554598278467
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,5120,768,0.04435555471314324
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,5120,256,0.007600000335110559
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,5120,512,0.023039110832744177
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,5120,512,0.03694222370783488
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,5120,128,0.0069351109365622205
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,5120,5120,0.15355111493004694
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,5120,256,0.019948444432682462
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,5120,256,0.03224710954560174
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,5120,64,0.006280888699822956
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,5120,32,0.0063786668082078295
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,5120,128,0.027683556079864502
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,5120,128,0.019588443968031142
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,5120,2560,0.031189332405726116
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,5120,64,0.0192239996459749
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,5120,32,0.019096000327004325
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,5120,3072,0.07604622178607516
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,5120,2560,0.08920977512995402
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,4096,16384,0.15720444255405003
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,4096,51200,0.4795857535468207
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,4096,65536,0.5909297731187608
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,4096,12288,0.12827555338541666
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,4096,16384,0.3509395652347141
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,4096,12288,0.278839111328125
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,4096,16384,0.4788115819295247
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,4096,10240,0.10648710860146417
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,4096,51200,1.1396267149183485
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,4096,12288,0.3522977828979492
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,4096,8192,0.08412622080908881
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,4096,65536,1.449702262878418
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,4096,10240,0.22366666793823242
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,4096,8192,0.17112178272671172
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,4096,10240,0.3036266697777642
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,4096,8192,0.23352265357971191
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,4096,6144,0.06269866890377469
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,4096,7168,0.14904622236887613
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,4096,51200,1.4031182395087347
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,4096,5120,0.052221334642834134
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,4096,7168,0.20475378301408556
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,4096,4096,0.0444524453745948
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,4096,6144,0.12809333536359999
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,4096,6144,0.17837688657972547
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,4096,3584,0.03943199912707011
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,4096,5120,0.10840888818105061
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,4096,5120,0.15262222290039062
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,4096,65536,1.7925652398003473
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,4096,3072,0.034224887688954674
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,4096,4096,0.08908710877100627
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,4096,4096,0.12678310606214735
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,4096,2560,0.029022223419613306
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,4096,3584,0.07854488823148939
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,4096,3584,0.11347111066182454
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,4096,2048,0.02482844392458598
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,4096,3072,0.07074933581882052
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,4096,3072,0.10099377897050645
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,4096,2560,0.0602160029941135
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,4096,1536,0.01975911193423801
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,4096,2560,0.08780444330639309
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,4096,1024,0.015185778339703878
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,4096,2048,0.0490862230459849
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,4096,768,0.012103111379676394
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,4096,1536,0.040377779139412776
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,4096,1536,0.06350844436221652
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,4096,512,0.009947555760542551
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,4096,1024,0.04794222116470337
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,4096,1024,0.030012445317374334
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,4096,7168,0.07460533248053657
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,4096,256,0.007784888976150089
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,4096,768,0.026122666067547266
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,4096,128,0.006559111177921295
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,4096,512,0.03628977802064683
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,4096,256,0.030864887767367895
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,4096,64,0.007307555940416124
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,4096,128,0.027077333794699773
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,4096,128,0.017900443739361234
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,4096,32,0.01034222212102678
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,4096,64,0.017895110779338412
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,4096,32,0.017277333471510146
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,3584,65536,0.4551253318786621
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,4096,2048,0.07566222217347887
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,3584,51200,0.3775431050194635
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,4096,768,0.04198844565285576
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,4096,512,0.021290666527218286
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,4096,256,0.018449778358141582
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,3584,16384,0.14522400167253283
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,3584,12288,0.10628800259696113
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,3584,65536,1.3532578150431316
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,3584,16384,0.33281421661376953
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,3584,10240,0.07638844516542223
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,3584,12288,0.26414844724867076
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,3584,16384,0.43073333634270566
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,3584,8192,0.06969955232408312
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,3584,12288,0.3278435601128472
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,3584,51200,1.0699084599812825
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,3584,10240,0.20713067054748535
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,3584,10240,0.27664444181654185
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,3584,7168,0.056121779812706836
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,3584,8192,0.16342311435275608
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,3584,6144,0.049583110544416636
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,3584,7168,0.14106310738457575
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,3584,65536,1.6536436080932617
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,3584,8192,0.21644888983832467
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,3584,5120,0.04153777824507819
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,3584,7168,0.19162400563557944
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,3584,6144,0.12127910719977485
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,3584,4096,0.03165510959095425
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,3584,3584,0.02932000160217285
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,3584,5120,0.1415839989980062
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,3584,5120,0.10282933049731785
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,3584,51200,1.3052186965942383
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,3584,4096,0.08547377586364746
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,3584,3072,0.025841777523358662
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,3584,4096,0.11768799357944065
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,3584,2560,0.02124888863828447
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,3584,3584,0.07607555389404297
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,3584,2048,0.018053332964579265
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,3584,3584,0.10594399770100911
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,3584,3072,0.06623999940024482
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,3584,3072,0.09429244200388591
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,3584,1536,0.015300444430775113
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,3584,2560,0.05647644731733534
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,3584,2560,0.08256622155507405
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,3584,1024,0.01126488877667321
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,3584,768,0.009477333062224919
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,3584,2048,0.07129066520267062
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,3584,2048,0.04606489009327359
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,3584,1536,0.038351999388800725
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,3584,1536,0.0602017773522271
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,3584,1024,0.045888000064426
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,3584,1024,0.028487109475665625
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,3584,256,0.0068604445291890045
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,3584,768,0.04078222314516703
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,3584,768,0.025029333101378545
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,3584,128,0.005960000058015187
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,3584,512,0.034522665871514216
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,3584,512,0.020296888218985665
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,3584,64,0.005613333235184352
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,3584,256,0.017851556340853374
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,3584,256,0.030138668086793687
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,3584,32,0.0059075554211934405
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,3584,128,0.026198221577538386
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,3584,128,0.01724799970785777
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,3584,64,0.01685066686736213
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,3584,32,0.016543999314308167
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,3584,6144,0.16540355152553982
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,3072,51200,0.3619617886013455
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,3072,65536,0.47257423400878906
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,3072,16384,0.1277866628434923
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,3072,12288,0.09823111030790542
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,3072,16384,0.3353404468960232
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,3584,512,0.007924444145626491
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,3072,12288,0.2396399974822998
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,3072,16384,0.4472488827175564
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,3072,10240,0.07247644662857056
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,3072,51200,1.0064356062147353
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,3072,12288,0.3311591148376465
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,3072,10240,0.19828889105055067
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,3072,7168,0.05124533176422119
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,3072,10240,0.273855103386773
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,3072,8192,0.15565155612097845
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,3072,6144,0.04457599918047587
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,3072,8192,0.2162604464424981
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,3072,7168,0.1344675620396932
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,3072,51200,1.2895563973320854
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,3072,7168,0.19167199399736193
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,3072,5120,0.03722666700681051
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,3072,6144,0.11652355723910862
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,3072,4096,0.030978666411505804
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,3072,6144,0.1647688945134481
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,3072,5120,0.09877689017189874
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,3072,3584,0.02867199977238973
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,3072,65536,1.6471537484063044
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,3072,4096,0.08124088578754
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,3072,4096,0.11738844712575276
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,3072,3584,0.10549866490893894
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,3072,3072,0.06368977493709989
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,3072,2560,0.021543110410372417
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,3072,8192,0.05571644173728096
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,3072,2560,0.053616000546349414
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,3072,2048,0.017543110582563613
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,3072,2048,0.044417778650919594
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,3072,2048,0.07094844182332356
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,3072,1536,0.01423733267519209
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,3072,5120,0.14078222380744085
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,3072,1536,0.036257776949140764
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,3072,3072,0.025057777762413025
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,3072,1024,0.01033333357837465
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,3072,1536,0.058125330342186816
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,3072,3584,0.07244088914659289
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,3072,768,0.008650666309727563
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,3072,1024,0.045165333482954234
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,3072,1024,0.027482666903071936
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,3072,512,0.007267555428875818
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,3072,768,0.040561778677834406
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,3072,3072,0.09389866722954644
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,3072,256,0.005943999936183293
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,3072,512,0.019515555765893724
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,3072,128,0.00553955551650789
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,3072,65536,1.2935795254177518
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,3072,2560,0.0820302234755622
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,3072,256,0.01719999975628323
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,3072,64,0.004909333255555895
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,3072,128,0.016511999898486666
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,3072,128,0.025478222303920325
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,3072,64,0.01649688846535153
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,3072,32,0.015803555647532146
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,2560,65536,0.31688443819681805
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,2560,51200,0.26020267274644643
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,3072,768,0.02375288969940609
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,3072,512,0.03394666645261977
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,2560,16384,0.09826044241587321
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,3072,256,0.029842668109469946
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,3072,32,0.00489777781897121
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,2560,12288,0.07318222522735596
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,2560,65536,1.195185767279731
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,2560,16384,0.2993084324730767
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,2560,10240,0.06383377975887723
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,2560,16384,0.39402490191989475
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,2560,12288,0.2996986707051595
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,2560,8192,0.049824890163209706
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,2560,10240,0.1874764495425754
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,2560,51200,0.9555724461873373
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,2560,7168,0.04149333304829068
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,2560,10240,0.2478097809685601
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,2560,6144,0.03703466720051236
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,2560,8192,0.14663910865783691
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,2560,8192,0.19770399729410806
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,2560,7168,0.17458577950795492
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,2560,5120,0.031071109904183283
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,2560,6144,0.10929244756698608
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,2560,51200,1.1830097834269206
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,2560,6144,0.15125155448913574
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,2560,4096,0.02509422269132402
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,2560,3584,0.02184177769554986
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,2560,5120,0.12997155719333225
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,2560,4096,0.07638044489754571
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,2560,4096,0.1079368856218126
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,2560,3072,0.02019733356104957
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,2560,3584,0.09736533297432794
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,2560,3584,0.06760888629489474
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,2560,2560,0.017774222625626456
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,2560,3072,0.08687733279334174
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,2560,3072,0.058563556936052114
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,2560,2048,0.014829332629839579
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,2560,2560,0.04988444513744778
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,2560,2560,0.07647999789979723
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,2560,1536,0.012044444680213928
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,2560,12288,0.2254257731967502
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,2560,2048,0.04101244608561198
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,2560,1024,0.009367110828558603
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,2560,2048,0.06592355834113227
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,2560,768,0.008291555775536431
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,2560,1536,0.033604443073272705
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,2560,1024,0.0424924459722307
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,2560,1024,0.026047110557556152
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,2560,512,0.006960888703664144
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,2560,768,0.022631110416518316
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,2560,256,0.005599110904667113
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,2560,7168,0.1288657718234592
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,2560,512,0.018811555372344125
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,2560,128,0.004870222260554631
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,2560,256,0.028817776176664565
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,2560,128,0.015592000550693937
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,2560,5120,0.09303022093243069
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,2560,64,0.004574222283230888
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,2560,128,0.02474400069978502
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,2560,32,0.004870222260554631
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,2560,64,0.015460444821251763
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,2560,32,0.015465777781274585
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,2048,65536,0.33417865965101456
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,2560,1536,0.05382755398750305
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,2048,51200,0.264061344994439
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,2560,768,0.0380328893661499
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,2560,65536,1.5080827077229817
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,2560,512,0.032920890384250216
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,2048,16384,0.08908533387713963
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,2560,256,0.01651022169325087
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,2048,12288,0.0652444428867764
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,2048,16384,0.2854693465762668
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,2048,65536,1.1405804951985676
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,2048,16384,0.39196001158820254
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,2048,12288,0.2156764401329888
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,2048,51200,0.8914960225423177
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,2048,8192,0.04551288816663954
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,2048,12288,0.2984044551849365
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,2048,10240,0.1790835592481825
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,2048,7168,0.03790488839149475
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,2048,10240,0.24785423278808594
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,2048,8192,0.1399573352601793
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,2048,65536,1.499036471048991
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,2048,8192,0.19741243786282012
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,2048,6144,0.033555554019080266
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,2048,5120,0.028897778855429754
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,2048,7168,0.172980440987481
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,2048,51200,1.1958612865871854
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,2048,4096,0.024305777417288885
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,2048,6144,0.15107911162906223
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,2048,5120,0.08842400047514175
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,2048,5120,0.1282151142756144
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,2048,3584,0.022336888644430373
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,2048,4096,0.072708441151513
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,2048,4096,0.10764266384972467
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,2048,3072,0.01919644408755832
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,2048,3584,0.06419466601477729
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,2048,3584,0.0969582200050354
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,2048,2560,0.01736088924937778
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,2048,10240,0.05422844489415487
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,2048,3072,0.05601421991984049
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,2048,2048,0.01499555508295695
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,2048,2560,0.046912001238928906
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,2048,2560,0.07587822278340657
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,2048,1536,0.011614222493436603
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,2048,2048,0.06572533316082425
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,2048,2048,0.04006933172543844
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,2048,1024,0.009372444616423713
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,2048,1536,0.03275555703375075
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,2048,1536,0.05333155393600464
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,2048,768,0.008113777471913232
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,2048,1024,0.024992000725534227
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,2048,1024,0.04232888751559787
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,2048,512,0.0069857777820693115
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,2048,768,0.02186044388347202
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,2048,256,0.005601777798599667
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,2048,7168,0.1206444501876831
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,2048,512,0.018008000320858426
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,2048,512,0.03264355659484863
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,2048,128,0.004848000076082018
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,2048,6144,0.1041226651933458
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,2048,256,0.028142223755518597
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,2048,256,0.015824889143308003
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,2048,64,0.00453955555955569
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,2048,32,0.005486222190989389
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,2048,128,0.024271999796231587
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,2048,128,0.015160888433456421
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,2048,64,0.014766222900814481
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,2048,32,0.014797333214018079
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,1536,65536,0.23591465420193145
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,1536,51200,0.1969306601418389
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,2048,3072,0.08643644385867649
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,1536,16384,0.06575377782185872
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,1536,16384,0.26789866553412545
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,1536,12288,0.04548888736300998
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,2048,768,0.03798310955365499
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,1536,16384,0.4045875602298313
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,1536,51200,0.8156568739149305
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,1536,10240,0.03980177640914917
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,1536,65536,1.0431973139444988
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,1536,12288,0.20187821653154162
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,1536,8192,0.03118577930662367
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,1536,7168,0.027610666222042505
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,1536,10240,0.16658133930630153
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,1536,10240,0.247977786593967
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,1536,8192,0.13060711489783391
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,1536,8192,0.19545155101352266
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,1536,6144,0.024347555306222703
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,1536,7168,0.11309956179724799
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,1536,7168,0.17218400372399223
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,1536,51200,1.1746098200480144
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,1536,4096,0.017158221867349412
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,1536,6144,0.14965866671668157
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,1536,5120,0.0817742215262519
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,1536,3584,0.015903110305468243
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,1536,5120,0.12855911254882812
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,1536,4096,0.06711555851830377
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,1536,4096,0.1066711081398858
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,1536,3072,0.013943110903104147
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,1536,3584,0.059141331248813205
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,1536,3584,0.09627733627955119
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,1536,2560,0.01236977759334776
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,1536,3072,0.051669332716200084
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,1536,3072,0.08589777681562637
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,1536,2048,0.0103493332862854
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,1536,2560,0.04414844512939453
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,1536,2560,0.0758462217119005
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,1536,1536,0.008601778083377415
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,1536,2048,0.036120888259675764
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,1536,2048,0.06461866696675618
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,1536,1024,0.0076044441925154785
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,1536,1536,0.029875556627909344
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,1536,1536,0.05272710985607571
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,1536,12288,0.29693155818515354
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,1536,768,0.006305777778228124
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,1536,1024,0.02332177758216858
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,1536,1024,0.042021334171295166
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,1536,512,0.005264889034960005
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,1536,5120,0.020950223008791607
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,1536,768,0.037560890118281044
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,1536,768,0.02051466703414917
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,1536,256,0.004574222283230888
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,1536,512,0.032481776343451604
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,1536,512,0.01720622181892395
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,1536,128,0.004119111018048393
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,1536,6144,0.09735555781258477
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,1536,64,0.0038480001191298165
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,1536,65536,1.4893875122070312
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,1536,256,0.015081778168678284
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,1536,128,0.024339555038346186
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,1536,128,0.014139556222491793
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,1536,64,0.014089778065681458
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,1536,32,0.013912000589900546
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,1024,65536,0.18372800615098742
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,1024,51200,0.14743288358052573
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,1024,16384,0.048932443062464394
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,1024,16384,0.25482132699754506
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,1024,51200,0.7732595337761773
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,1024,12288,0.034557332595189415
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,1024,65536,0.9854355918036567
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,1024,16384,0.35390488306681317
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,1536,256,0.02805244591501024
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,1536,32,0.0041697778635554844
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,1024,10240,0.02886755598915948
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,1024,8192,0.023745778534147475
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,1024,51200,1.0622168646918404
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,1024,12288,0.1919004387325711
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,1024,12288,0.2696835464901394
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,1024,7168,0.021288888321982488
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,1024,10240,0.1587795548968845
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,1024,65536,1.3480728997124567
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,1024,10240,0.22378312216864693
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,1024,6144,0.019291554888089497
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,1024,8192,0.12337956163618301
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,1024,5120,0.01680888897842831
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,1024,8192,0.17739644315507677
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,1024,4096,0.01461155547036065
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,1024,7168,0.10679822497897679
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,1024,6144,0.1361680030822754
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,1024,5120,0.1165706713994344
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,1024,3584,0.01260444439119763
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,1024,4096,0.09749333063761394
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,1024,3072,0.011662222445011139
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,1024,3584,0.08791999684439765
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,1024,3584,0.0554257763756646
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,1024,2560,0.010039110978444418
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,1024,3072,0.04799377918243408
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,1024,3072,0.07807022333145142
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,1024,2048,0.008789333204428354
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,1024,2560,0.04043644335534837
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,1024,2560,0.06958578030268352
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,1024,1536,0.007633777956167857
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,1024,2048,0.05957688887914022
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,1024,1536,0.02868177824550205
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,1024,1536,0.05076355404324002
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,1024,1024,0.006243555496136348
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,1024,1024,0.022388445006476507
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,1024,1024,0.03932711150911119
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,1024,768,0.00554666668176651
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,1024,7168,0.15587111314137778
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,1024,512,0.004914666629499859
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,1024,6144,0.09166400300131904
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,1024,5120,0.07735555701785617
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,1024,768,0.019555555449591745
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,1024,768,0.035271111461851336
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,1024,256,0.004182222402758068
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,1024,128,0.0038408889538711975
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,1024,4096,0.06323555443021986
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,1024,512,0.03029777937465244
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,1024,512,0.016184889607959323
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,1024,256,0.026779555612140234
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,1024,256,0.014096000128322177
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,1024,64,0.003626666549179289
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,1024,32,0.0038488888078265717
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,1024,128,0.013456888496875763
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,1024,64,0.013515555196338229
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,1024,32,0.013187555803192986
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,768,65536,0.14727644125620523
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,768,51200,0.11419822110070123
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,768,16384,0.03894666830698649
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,1024,2048,0.03400977783732944
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,768,12288,0.027914666467242773
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,768,16384,0.24539377954271105
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,768,16384,0.3521440029144287
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,768,10240,0.023523555861579046
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,768,12288,0.18508977360195586
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,768,51200,0.7401839892069498
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,768,12288,0.2698124514685737
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,768,65536,0.9482204649183484
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,768,8192,0.01953066719902886
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,768,10240,0.15285332997639975
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,768,7168,0.017821333474583097
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,768,8192,0.11945866213904487
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,768,8192,0.17774666680230033
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,768,51200,1.0561964246961806
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,1024,128,0.023758222659428913
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,768,6144,0.0158933334880405
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,768,7168,0.10243288675944011
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,768,5120,0.01370488852262497
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,768,65536,1.3432248433430989
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,768,7168,0.15596621566348606
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,768,4096,0.011752888560295105
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,768,6144,0.08787644571728176
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,768,5120,0.11629866229163276
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,768,3584,0.010414222048388587
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,768,6144,0.13627021842532688
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,768,5120,0.07416711250940959
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,768,4096,0.09709333048926459
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,768,4096,0.06068266762627495
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,768,3584,0.0881706674893697
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,768,2560,0.008662222160233391
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,768,3584,0.052729778819613986
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,768,2048,0.0076453329788313965
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,768,3072,0.04628533456060621
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,768,2560,0.06868444548712836
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,768,2560,0.039510223600599505
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,768,1536,0.006701333241330252
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,768,2048,0.03288266725010342
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,768,2048,0.05840355820126004
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,768,1024,0.006152888966931238
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,768,1536,0.027457776996824477
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,768,768,0.005559999909665849
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,768,1024,0.02160266704029507
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,768,1024,0.038682666089799665
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,768,10240,0.22294667032029894
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,768,512,0.004570666700601578
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,768,768,0.019089778264363606
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,768,768,0.03499022126197815
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,768,512,0.029841777351167467
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,768,256,0.013754666679435305
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,768,256,0.026053332620196875
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,768,128,0.003559111307064692
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,768,128,0.0131217779384719
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,768,128,0.022799111074871484
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,768,64,0.0032266666077905228
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,768,3072,0.010110222631030613
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,768,32,0.003485333174467087
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,512,65536,0.10160533587137859
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,768,3072,0.07853511306974623
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,768,64,0.012844444149070315
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,768,32,0.01316088851955202
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,512,51200,0.07945422331492107
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,768,1536,0.04878488845295376
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,512,16384,0.03217511044608222
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,768,256,0.00388711111413108
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,768,512,0.015808888607554965
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,512,12288,0.02368444369898902
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,512,16384,0.2352844344245063
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,512,51200,0.710385799407959
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,512,10240,0.020962667134073045
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,512,12288,0.17776532967885336
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,512,16384,0.34883912404378253
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,512,12288,0.265976005130344
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,512,8192,0.017601778109868366
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,512,51200,1.0434275733100045
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,512,8192,0.11433688799540202
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,512,7168,0.015489778584904142
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,512,65536,1.328298674689399
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,512,6144,0.014076444837782117
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,512,7168,0.09842044115066528
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,512,7168,0.15466845035552979
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,512,5120,0.012102222277058495
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,512,6144,0.08433689011467828
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,512,6144,0.1352862252129449
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,512,5120,0.11595822705162896
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,512,4096,0.05761155817243788
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,512,3584,0.009346666435400644
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,512,4096,0.09679110844930013
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,512,65536,0.9054578145345052
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,512,3072,0.00868088917599784
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,512,3584,0.05059022373623318
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,512,3584,0.08694399727715386
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,512,2560,0.007660444411966536
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,512,3072,0.04256177941958109
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,512,3072,0.07739555835723877
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,512,2048,0.0079644446571668
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,512,8192,0.1758035553826226
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,512,2560,0.06699199808968438
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,512,1536,0.006608888920810487
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,512,2048,0.056847108734978564
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,512,1536,0.026175111532211304
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,512,1024,0.005544888890451855
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,512,1536,0.04821777674886915
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,512,4096,0.010102222363154093
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,512,768,0.004863111095296012
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,512,1024,0.02093511157565647
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,512,5120,0.07098755571577284
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,512,768,0.034853332572513156
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,512,512,0.00453244439429707
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,512,512,0.015427556302812366
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,512,512,0.02983733349376255
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,512,256,0.0038568890757030914
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,512,10240,0.14714754952324763
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,512,256,0.013336000343163809
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,512,128,0.003549333247873518
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,512,2048,0.031621333625581526
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,512,256,0.026847110854254827
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,512,128,0.012749333348539142
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,512,64,0.0035537779331207275
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,512,128,0.02295555505487654
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,512,32,0.003567111161020067
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,512,64,0.012416000167528788
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,512,1024,0.03838488790724013
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,512,32,0.012486221889654795
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,256,65536,0.05836177534527249
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,256,51200,0.04760622315936618
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,512,768,0.01854933301607768
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,256,16384,0.0188773340649075
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,256,16384,0.2248542308807373
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,512,10240,0.22057510746849907
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,256,12288,0.018014222383499146
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,256,51200,0.6764293246799045
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,256,65536,0.8619413375854492
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,256,10240,0.016176889340082806
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,256,16384,0.3470319906870524
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,256,12288,0.16980089081658256
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,256,8192,0.013507555756303998
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,256,51200,1.0376257366604276
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,256,12288,0.26506845156351727
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,256,10240,0.14006933901045057
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,256,7168,0.012078222301271228
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,256,10240,0.22088355488247344
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,256,65536,1.3229395548502605
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,256,8192,0.10879377524058025
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,256,8192,0.17558044857449004
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,256,7168,0.15444355540805393
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,256,5120,0.009724444813198512
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,256,7168,0.09343555238511826
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,256,6144,0.07963644133673774
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,256,6144,0.1344204478793674
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,256,4096,0.008047111332416534
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,256,3584,0.007510222494602203
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,256,5120,0.06732000244988336
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,256,5120,0.11484000417921279
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,256,3072,0.006959111326270633
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,256,4096,0.0540559987227122
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,256,4096,0.09547999832365249
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,512,2560,0.03730666637420654
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,256,2560,0.006259555617968242
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,256,3584,0.0861848857667711
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,256,2048,0.005538666827811136
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,256,3072,0.04145510991414388
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,256,3072,0.07657688856124878
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,256,1536,0.004911111046870549
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,256,2560,0.0350213348865509
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,256,2048,0.029799110359615747
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,256,1024,0.004181333300140169
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,256,1536,0.04794133371777005
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,256,1024,0.01999022232161628
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,256,1024,0.038041777080959745
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,256,768,0.0038480001191298165
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,256,6144,0.010657777388890585
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,256,512,0.0035422220826148987
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,256,768,0.017869333426157635
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,256,768,0.034281777011023626
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,256,256,0.0031600000543726813
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,256,512,0.029812445243199665
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,256,512,0.015121777852376303
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,256,128,0.0031600000543726813
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,256,256,0.012732444538010491
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,256,256,0.025705777936511572
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,256,128,0.0214346663819419
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,256,64,0.0028862222615215513
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,256,128,0.01240799989965227
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,256,32,0.003156444471743372
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,128,65536,0.04561777909596761
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,256,64,0.012050666742854647
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,256,32,0.012109333442317115
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,256,3584,0.04846488767200046
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,128,51200,0.037026666932635836
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,256,2560,0.06548444430033366
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,128,16384,0.012427555190192329
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,256,2048,0.05669244130452474
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,128,12288,0.010447111394670276
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,256,1536,0.02536533276240031
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,128,16384,0.2244782182905409
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,128,12288,0.16933511363135445
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,128,16384,0.34670223130120176
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,128,10240,0.01167555567291048
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,128,12288,0.26468178961012095
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,128,8192,0.011029333704047732
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,128,51200,0.6758497556050619
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,128,65536,0.862369802263048
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,128,10240,0.13943289385901556
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,128,7168,0.011583111352390714
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,128,10240,0.2202986611260308
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,128,6144,0.010409778190983666
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,128,8192,0.17509155803256563
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,128,7168,0.09269511037402683
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,128,7168,0.1534364488389757
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,128,51200,1.0359697341918945
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,128,5120,0.009306666751702627
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,128,4096,0.007616000043021307
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,128,5120,0.06692355871200562
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,128,65536,1.320673730638292
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,128,6144,0.13345777988433838
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,128,5120,0.11479200257195367
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,128,3584,0.007272000114123027
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,128,4096,0.05394577648904589
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,128,3072,0.006593777901596493
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,128,4096,0.09581244654125637
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,128,3584,0.08586844470765854
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,128,3584,0.04678933487998115
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,128,2560,0.005946666830115848
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,128,3072,0.040956444210476346
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,128,3072,0.07608444160885282
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,128,2048,0.0052373334765434265
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,128,1536,0.0046951112647851305
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,128,2560,0.06532000170813666
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,128,2560,0.035826666487587824
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,128,2048,0.029817776547537908
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,128,2048,0.0567164421081543
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,128,1536,0.02528800070285797
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,128,1536,0.04754933383729723
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,128,1024,0.0380311111609141
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,128,1024,0.019904888338512845
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,128,512,0.0035093331502543557
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,128,8192,0.10797688696119521
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,128,768,0.017855111095640395
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,128,768,0.03427555494838291
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,128,256,0.003145777723855443
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,128,512,0.014493332968817817
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,128,512,0.029464887248145208
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,128,128,0.0028293333533737394
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,128,256,0.012509333590666452
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,128,256,0.025073778298166063
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,128,6144,0.07966666751437716
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,128,64,0.0028213332924577924
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1792,128,128,0.02161600026819441
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,128,128,0.012030222349696688
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,64,65536,0.044900443818834096
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,128,64,0.011724444727102915
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,128,32,0.011701333026091257
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,64,51200,0.034576889541414045
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,64,16384,0.014139556222491793
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,64,12288,0.012109333442317115
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,64,16384,0.22397510210673013
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,64,12288,0.16946755515204537
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,64,10240,0.011034666664070554
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,64,8192,0.010354667074150508
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,128,1024,0.0041928887367248535
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,64,7168,0.009655111365848118
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,128,768,0.0038480001191298165
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,64,6144,0.00903200027015474
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,64,51200,0.6757289038764106
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,64,8192,0.10800533162222968
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,64,5120,0.008636444807052612
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,64,65536,0.8606870969136556
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,64,4096,0.00795288880666097
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,64,3584,0.006952889263629913
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,64,6144,0.07919466495513916
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,64,5120,0.06738933589723375
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,64,3072,0.006295111030340195
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,64,4096,0.053842667076322764
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,64,3584,0.046560890144772
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,128,32,0.002874666617976295
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,64,2048,0.0052488889131281115
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,64,3072,0.03981155488226149
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,64,2560,0.03487911158137851
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,64,1024,0.0038764443662431505
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,64,2048,0.029863112502627905
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,64,768,0.0038577777643998465
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,64,1536,0.0247999992635515
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,64,512,0.0035173334181308746
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,64,1024,0.020096888144810993
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,64,256,0.003042666655447748
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,64,768,0.01753777762254079
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,64,128,0.0028320000403457214
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,64,512,0.014495111174053617
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,64,64,0.0028364445186323593
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,64,256,0.012436444560686747
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,64,32,0.0026231110095977783
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,64,128,0.011765333513418833
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,64,64,0.011697777443461947
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,32,65536,0.04076000054677328
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,64,10240,0.13907821973164877
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,64,32,0.011685333318180509
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,32,51200,0.03325600094265408
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,32,16384,0.009639999932712978
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,64,7168,0.09257155656814575
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,64,2560,0.005928888916969299
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,32,16384,0.22421956062316895
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,32,10240,0.007961778177155389
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,32,12288,0.16895111401875815
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,32,7168,0.006919999917348226
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,64,1536,0.004527111020353106
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,32,6144,0.010403555300500657
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,32,10240,0.13934044043223062
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,32,8192,0.10725244548585679
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,32,7168,0.09242400195863511
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,32,5120,0.009536888864305284
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,32,4096,0.00868088917599784
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,32,65536,0.8618559837341309
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,32,6144,0.07888711161083646
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,32,3584,0.008293333152929941
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,32,3072,0.006584888945023219
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,32,5120,0.06698489189147949
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,32,4096,0.05347555544641283
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,32,2560,0.005741333381997214
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,32,2048,0.005879999862776862
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,32,3584,0.046988444195853345
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,32,1536,0.004595555365085602
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,32,3072,0.03990666733847724
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,32,2560,0.03439999951256646
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,32,1024,0.003850666599141227
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,32,2048,0.029847111966874864
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,32,768,0.003546666767862108
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,32,512,0.003208000005947219
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,32,1536,0.025358221597141687
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,32,12288,0.008653333617581261
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,32,256,0.002895999906791581
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,32,1024,0.019903111788961623
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,32,128,0.002858666703104973
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,32,768,0.01773866679933336
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,32,64,0.0028702221396896574
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,32,512,0.014491554763582019
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,32,32,0.002855111120475663
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,32,256,0.012438221938080259
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,32,128,0.012055111428101858
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,32,64,0.011777777638700275
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1792,32,8192,0.007605333295133378
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,32,32,0.011428444749779172
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1792,32,51200,0.675813357035319
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,65536,12288,1.543082661098904
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,65536,10240,1.4190204408433702
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,65536,12288,1.7587626775105794
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,65536,16384,2.043611526489258
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,65536,16384,2.3726213243272567
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,65536,8192,1.1389573415120442
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,65536,7168,0.9830026626586914
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,65536,8192,1.1186648474799263
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,65536,10240,1.4155155817667644
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,65536,7168,0.9334551493326823
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,65536,6144,0.8819262186686198
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,65536,5120,0.7256071302625867
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,65536,4096,0.5633795526292589
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,65536,5120,0.6760257614983453
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,65536,6144,0.8330151240030924
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,65536,3584,0.5977617899576823
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,65536,4096,0.5344035360548232
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,65536,3072,0.4490248892042372
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,65536,3072,0.410694228278266
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,65536,2560,0.3630373213026259
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,65536,2048,0.2611582279205322
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,65536,3584,0.516266663869222
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,65536,1536,0.22033866246541342
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,65536,1024,0.15806133217281765
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,65536,2560,0.45450666215684676
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,65536,2048,0.33722755644056535
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,65536,1024,0.17425510618421766
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,65536,1536,0.24367200003729927
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,65536,768,0.12364799446529812
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,65536,512,0.09402577744589911
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,65536,256,0.05928977992799547
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,65536,128,0.046705779102113515
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,65536,64,0.044715556833479136
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,65536,768,0.1438657840092977
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,65536,32,0.04701155424118042
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,65536,256,0.11173689365386963
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,65536,128,0.1007395585378011
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,65536,512,0.12169688277774388
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,65536,64,0.104839113023546
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,65536,32,0.10244177447424994
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,65536,51200,6.438799116346572
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,51200,16384,1.5725537406073675
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,51200,16384,1.873602761162652
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,51200,12288,1.3404195573594835
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,51200,12288,1.3711546791924372
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,51200,10240,1.0416000154283311
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,65536,51200,8.932272169325087
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,51200,8192,0.8710959752400717
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,51200,10240,1.1074373457166884
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,51200,7168,0.7441146638658312
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,51200,8192,0.8830035527547201
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,51200,51200,4.756446414523654
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,51200,6144,0.6578390863206651
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,51200,5120,0.4484791225857205
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,51200,7168,0.8480177985297309
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,51200,6144,0.7325688997904459
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,51200,4096,0.46197064717610675
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,51200,4096,0.44916889402601456
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,51200,3584,0.3489528761969672
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,51200,3072,0.3219208982255724
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,51200,3584,0.3855813344319661
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,51200,5120,0.5551973448859321
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,51200,2560,0.2904222276475695
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,51200,3072,0.3268924554189046
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,51200,2048,0.18783466021219888
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,51200,1536,0.1550968885421753
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,51200,65536,6.204514821370442
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,51200,2048,0.2300728956858317
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,51200,1024,0.10905955235163371
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,51200,2560,0.310331556532118
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,51200,768,0.09403733412424724
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,51200,512,0.07028800249099731
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,51200,256,0.050029334094789296
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,51200,768,0.11927733156416152
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,51200,512,0.09594400061501397
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,51200,128,0.04247466723124186
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,51200,256,0.08800088697009617
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,51200,64,0.035790221558676824
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,51200,32,0.03639111253950331
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,51200,51200,6.6763733757866754
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,51200,128,0.08137422137790255
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,51200,64,0.08134133285946317
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,51200,32,0.08231466346316867
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,51200,1536,0.18067910936143664
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,51200,1024,0.14384178320566812
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,16384,16384,0.43880534172058105
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,16384,12288,0.346910211775038
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,16384,51200,1.6790275573730469
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,16384,65536,2.098889880710178
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,16384,16384,0.6951724688212076
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,16384,10240,0.36727288034227157
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,51200,65536,9.114913092719183
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,16384,8192,0.22849689589606392
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,16384,12288,0.5259751213921441
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,16384,7168,0.2239848772684733
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,16384,6144,0.17835466066996256
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,16384,51200,2.419495052761502
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,16384,8192,0.40402666727701825
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,16384,10240,0.5251502460903591
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,16384,7168,0.3112773365444607
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,16384,4096,0.14847111701965332
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,16384,3584,0.13581155406104192
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,16384,5120,0.21248977714114717
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,16384,4096,0.18204977777269152
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,16384,3072,0.10884533325831096
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,16384,3584,0.1545377837287055
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,16384,2560,0.08579555484983657
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,16384,65536,3.2913004557291665
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,16384,2048,0.07319644424650404
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,16384,3072,0.1322800053490533
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,16384,1536,0.05520266625616285
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,16384,1024,0.03575999869240655
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,16384,768,0.028424888849258423
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,16384,1536,0.076292441950904
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,16384,1024,0.06258933411704169
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,16384,512,0.02293599976433648
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,16384,256,0.018826666805479262
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,16384,768,0.046853333711624146
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,16384,128,0.01570933394961887
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,16384,64,0.013389333254761167
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,16384,512,0.039424889617496066
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,16384,256,0.034244444635179304
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,16384,32,0.012319111161761813
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,16384,128,0.033424887392256
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,16384,64,0.03291911217901442
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,16384,32,0.03221688999070062
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,16384,5120,0.14735644393497044
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,16384,6144,0.28659555647108287
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,12288,16384,0.36267820994059247
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,16384,2560,0.12298756175571018
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,16384,2048,0.09502133395936753
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,12288,16384,0.5589680141872829
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,12288,12288,0.27184976471794975
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,12288,8192,0.17964711454179552
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,12288,10240,0.23315644264221191
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,12288,12288,0.4124604331122504
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,12288,10240,0.33885688251919216
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,12288,51200,1.3069182501898873
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,12288,7168,0.18061421977149117
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,12288,65536,1.5666595035129125
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,12288,5120,0.13184977902306452
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,12288,6144,0.13446933693355984
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,12288,8192,0.27412621180216473
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,12288,7168,0.23441865709092882
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,12288,6144,0.24705065621270073
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,12288,3584,0.07985511091020372
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,12288,4096,0.10401066806581284
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,12288,3072,0.07604889074961345
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,12288,4096,0.1395448843638102
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,12288,5120,0.1796728902392917
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,12288,2560,0.06576889091067843
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,12288,2048,0.0484444432788425
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,12288,51200,1.8802871704101562
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,12288,1536,0.04478133387035794
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,12288,3072,0.10860088798734878
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,12288,1024,0.02804888950453864
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,12288,2560,0.10337777932484944
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,12288,768,0.022804444034894306
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,12288,2048,0.08068977461920844
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,12288,512,0.017881777551439073
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,12288,256,0.014779556128713818
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,12288,1536,0.0629955530166626
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,12288,128,0.011394666300879585
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,12288,1024,0.0495377779006958
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,12288,768,0.03960444529851278
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,12288,64,0.010016889207892949
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,12288,512,0.03274222215016683
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,12288,32,0.010056888891590966
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,12288,256,0.028373334142896865
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,12288,128,0.02740977704524994
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,12288,65536,2.5755422380235458
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,12288,64,0.027259555127885606
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,12288,32,0.02676711148685879
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,10240,16384,0.26602400673760307
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,10240,12288,0.20332888762156168
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,10240,16384,0.49639733632405597
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,12288,3584,0.1240053309334649
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,10240,51200,0.8739466667175293
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,10240,10240,0.17484711276160347
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,10240,65536,1.1538879606458876
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,10240,8192,0.16532888677385119
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,10240,12288,0.3763599925571018
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,10240,10240,0.3005768987867567
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,10240,8192,0.23776178889804414
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,10240,7168,0.14367732736799452
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,10240,6144,0.10722044441435073
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,10240,5120,0.09142666392856175
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,10240,4096,0.07910399966769747
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,10240,7168,0.22976088523864746
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,10240,6144,0.1798559957080417
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,10240,3584,0.07081688774956597
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,10240,5120,0.1811831129921807
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,10240,3072,0.06020444631576538
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,10240,4096,0.12466933992173936
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,10240,2560,0.055213332176208496
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,10240,2048,0.041327999697791204
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,10240,3584,0.11740977234310573
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,10240,1536,0.03294666608174642
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,10240,3072,0.09797066450119019
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,10240,1024,0.025105777713987563
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,10240,2560,0.08500711123148601
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,10240,768,0.020248000820477802
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,10240,2048,0.07228889067967732
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,10240,512,0.015256888336605497
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,10240,1536,0.056574225425720215
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,10240,256,0.011863999896579318
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,10240,1024,0.04328533344798618
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,10240,128,0.009686222506894005
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,10240,768,0.035451554589801364
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,10240,64,0.008641777767075432
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,10240,512,0.030258665482203167
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,10240,65536,2.2276880476209855
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,10240,32,0.008663111262851292
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,10240,256,0.025772444076008264
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,10240,128,0.02474222249454922
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,10240,64,0.02471911079353756
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,10240,32,0.02490933405028449
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,8192,16384,0.24077243275112578
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,8192,12288,0.17038933436075845
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,8192,16384,0.4298657841152615
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,8192,51200,0.7323075400458442
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,8192,10240,0.14783199628194174
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,8192,65536,0.9472249348958334
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,8192,8192,0.11681244108412002
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,8192,12288,0.3290097713470459
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,8192,7168,0.09913600153393215
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,8192,10240,0.3215297857920329
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,8192,6144,0.08563555611504449
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,8192,8192,0.22875910335116914
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,8192,7168,0.18439822726779512
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,8192,5120,0.08153688907623291
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,8192,4096,0.07385155227449205
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,8192,6144,0.16434489356146917
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,8192,51200,1.4137875239054363
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,8192,3584,0.061892443233066134
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,8192,3072,0.05781866444481743
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,8192,2560,0.04517599940299988
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,8192,4096,0.10817688703536987
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,8192,3584,0.09966578086217244
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,8192,2048,0.03649955656793382
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,8192,3072,0.08627733257081772
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,8192,1536,0.02773333258099026
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,8192,65536,1.8257759941948786
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,8192,1024,0.020617778102556866
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,8192,2560,0.07470044162538317
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,8192,768,0.016873778568373788
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,8192,2048,0.062315556738111705
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,8192,512,0.013433777623706393
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,8192,1536,0.049230221245023936
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,8192,256,0.010288889209429422
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,8192,1024,0.03826311230659485
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,10240,51200,1.669891569349501
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,8192,64,0.007366221812036302
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,8192,512,0.02643555568324195
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,8192,32,0.007594666547245449
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,8192,256,0.022799111074871484
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,8192,128,0.022311111291249592
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,8192,64,0.022006221943431433
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,8192,32,0.021681777305073206
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,7168,16384,0.2149511045879788
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,8192,5120,0.13954667250315347
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,7168,51200,0.6388986905415853
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,7168,65536,0.8186728689405652
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,7168,12288,0.15101867251926
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,7168,16384,0.39657245741950137
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,7168,10240,0.17989599704742432
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,8192,128,0.008264888491895463
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,8192,768,0.03164622187614441
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,7168,10240,0.24352622032165527
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,7168,8192,0.14359377490149602
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,7168,7168,0.11387466059790717
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,7168,6144,0.10742311345206366
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,7168,51200,1.3238026301066081
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,7168,5120,0.08811822202470566
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,7168,6144,0.14565511544545492
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,7168,4096,0.0729973316192627
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,7168,65536,1.6925279829237196
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,7168,5120,0.12356444199879964
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,7168,3584,0.05889422363705105
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,7168,3072,0.05169599917199877
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,7168,4096,0.10114666488435532
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,7168,2560,0.03680088784959581
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,7168,3584,0.09187555313110352
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,7168,2048,0.030442665020624798
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,7168,3072,0.08141155375374688
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,7168,2560,0.06929600238800049
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,7168,1024,0.017997332745128207
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,7168,2048,0.05790755483839247
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,7168,768,0.015096000499195524
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,7168,1536,0.04670400089687771
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,7168,512,0.012192000117566852
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,7168,1024,0.035832888550228544
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,7168,256,0.009038222332795462
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,7168,768,0.029503110382292006
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,7168,128,0.008011555506123437
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,7168,512,0.024865777956114873
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,7168,64,0.007136888802051544
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,7168,256,0.02179644505182902
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,7168,8192,0.19186933835347494
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,7168,32,0.008648888932334052
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,7168,128,0.020975111259354487
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,7168,7168,0.16873599423302543
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,7168,32,0.020587555236286588
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,7168,1536,0.023751111494170293
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,6144,51200,0.5185875362820095
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,6144,65536,0.6714897685580783
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,6144,16384,0.178838226530287
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,6144,12288,0.15292621983422175
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,7168,12288,0.3233475685119629
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,6144,10240,0.12897066275278726
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,6144,16384,0.4082746770646837
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,6144,8192,0.10092800193362766
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,6144,12288,0.2732915613386366
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,7168,64,0.020920000142521326
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,6144,7168,0.08314400249057345
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,6144,51200,1.200657738579644
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,6144,6144,0.0788595543967353
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,6144,8192,0.18356445100572374
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,6144,5120,0.06649866369035509
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,6144,7168,0.1562097734875149
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,6144,65536,1.5464515686035156
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,6144,4096,0.0465191106001536
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,6144,3584,0.04339822133382162
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,6144,6144,0.14749333593580458
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,6144,3072,0.037137776613235474
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,6144,2560,0.033717334270477295
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,6144,4096,0.09421955876880223
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,6144,2048,0.027855998939938013
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,6144,3584,0.0837635530365838
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,6144,1536,0.022633777724372015
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,6144,2560,0.06431466341018677
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,6144,1024,0.017501332693629794
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,6144,768,0.015121777852376303
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,6144,2048,0.053159111075931124
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,6144,1536,0.042615112331178456
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,6144,512,0.011679111255539788
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,6144,1024,0.033534222178988986
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,6144,256,0.008832000195980072
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,6144,128,0.0073724447025193115
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,6144,768,0.028559999333487615
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,6144,64,0.006632888896597757
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,6144,32,0.006928000185224745
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,6144,256,0.020281778441535104
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,6144,128,0.0199297782447603
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,6144,64,0.01982666717635261
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,6144,32,0.019555555449591745
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,6144,10240,0.2249671088324653
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,5120,16384,0.13432621955871582
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,5120,51200,0.4217253261142307
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,6144,5120,0.11453955703311497
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,5120,12288,0.11716889010535346
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,6144,3072,0.07200888792673747
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,5120,10240,0.09025066428714329
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,5120,8192,0.07265422079298231
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,5120,12288,0.2513688935173882
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,5120,10240,0.20704800552792021
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,5120,7168,0.0688248872756958
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,6144,512,0.023378666904237535
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,5120,6144,0.05894755654864841
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,5120,51200,1.0802453358968098
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,5120,8192,0.16814933882819283
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,5120,5120,0.04850577645831638
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,5120,4096,0.04045155644416809
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,5120,7168,0.14312267303466797
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,5120,3584,0.03583022289805942
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,5120,65536,1.403958214653863
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,5120,5120,0.10502844386630589
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,5120,3072,0.0314702226055993
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,5120,4096,0.08573689063390096
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,5120,2560,0.02667377723587884
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,5120,3584,0.07702933417426215
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,5120,2048,0.021967111362351313
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,5120,1536,0.017885333961910672
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,5120,3072,0.06744266880883111
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,5120,2560,0.05744355254703098
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,5120,1024,0.013570666313171387
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,5120,2048,0.049492445256974965
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,5120,768,0.010828444527255164
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,5120,1536,0.03944799966282315
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,5120,1024,0.030866665972603693
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,5120,16384,0.33500178654988605
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,5120,256,0.0069360000391801195
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,5120,768,0.025916443930731878
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,5120,128,0.006524444454246097
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,5120,512,0.021683555510309007
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,5120,64,0.005961777849329843
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,5120,32,0.005943111247486538
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,5120,256,0.019204444355434842
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,5120,128,0.018565333551830716
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,5120,64,0.01822933389080895
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,5120,32,0.017892445127169292
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,5120,6144,0.12368444601694743
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,4096,51200,0.3770888911353217
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,4096,65536,0.45880619684855145
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,4096,16384,0.12565510802798802
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,4096,12288,0.09727822409735785
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,5120,65536,0.535736878712972
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,4096,10240,0.08446755674150254
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,4096,16384,0.3302328851487902
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,4096,8192,0.07275111145443387
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,5120,512,0.008621333373917473
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,4096,12288,0.22870667775472006
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,4096,7168,0.061794665124681264
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,4096,6144,0.05567289061016507
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,4096,10240,0.1864933305316501
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,4096,5120,0.042691555288102895
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,4096,51200,0.9729075961642795
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,4096,8192,0.15314755174848768
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,4096,7168,0.12981866465674505
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,4096,3584,0.0369395547442966
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,4096,6144,0.12247999509175618
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,4096,65536,1.2454666561550565
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,4096,3072,0.03260622090763516
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,4096,5120,0.09609955549240112
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,4096,4096,0.07906488577524821
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,4096,3584,0.07039911217159696
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,4096,1536,0.016231111354298063
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,4096,2560,0.05207644568549263
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,4096,1024,0.012095111111799875
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,4096,2048,0.04377955529424879
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,4096,768,0.010151111417346531
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,4096,1536,0.035812444157070585
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,4096,512,0.007984889050324758
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,4096,1024,0.027543110979927912
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,4096,256,0.006625777731339137
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,4096,768,0.02352711061636607
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,4096,128,0.005601777798599667
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,4096,512,0.02028888960679372
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,4096,64,0.004872000051869286
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,4096,256,0.017847110827763874
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,4096,32,0.005201777650250329
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,4096,128,0.01715377800994449
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,4096,64,0.017186666528383892
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,4096,32,0.016536000702116225
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,4096,4096,0.034830222527186074
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,3584,65536,0.3906577693091498
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,3584,51200,0.34612533781263566
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,4096,2560,0.02331999937693278
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,4096,2048,0.021201777789327834
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,4096,3072,0.062031997574700244
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,3584,12288,0.08462666802936131
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,3584,10240,0.0772577789094713
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,3584,8192,0.05726133452521431
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,3584,12288,0.21780089537302652
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,3584,16384,0.3065742121802436
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,3584,10240,0.1778951088587443
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,3584,7168,0.051947553952534996
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,3584,6144,0.0453324450386895
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,3584,8192,0.14052355289459229
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,3584,5120,0.03790844480196635
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,3584,7168,0.1271831062104967
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,3584,4096,0.030543999539481267
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,3584,6144,0.10831111007266575
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,3584,3584,0.02756711178355747
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,3584,65536,1.1776640150282118
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,3584,51200,0.9277884165445963
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,3584,3072,0.023406222462654114
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,3584,2560,0.02038755516211192
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,3584,5120,0.09231111076143052
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,3584,2048,0.0173999998304579
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,3584,4096,0.07562933365503947
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,3584,1536,0.014480888843536377
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,3584,3584,0.06775022215313382
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,3584,1024,0.010668444136778513
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,3584,3072,0.05901777744293213
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,3584,768,0.009024000002278222
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,3584,2560,0.04975377851062351
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,3584,512,0.007299555672539606
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,3584,1536,0.034619556532965765
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,3584,256,0.005997333261701796
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,3584,1024,0.026446221603287592
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,3584,128,0.005227555417352253
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,3584,768,0.02295911146534814
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,3584,512,0.01957244508796268
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,3584,256,0.01717688971095615
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,3584,32,0.004923555586073133
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,3584,128,0.01650399963061015
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,3584,16384,0.11640000343322754
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,3584,64,0.01648177703221639
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,3584,32,0.016367110941145156
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,3072,16384,0.09851821925905015
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,3072,51200,0.25931911998324925
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,3072,65536,0.3736017809973822
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,3072,12288,0.07294844256507026
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,3072,10240,0.06947111421161227
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,3072,16384,0.27778400315178764
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,3072,12288,0.22666578822665742
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,3072,8192,0.048920889695485435
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,3072,7168,0.04296977652443779
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,3072,10240,0.1750782198376126
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,3072,6144,0.03710755705833435
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,3584,2048,0.04196088843875461
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,3072,8192,0.1406995587878757
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,3072,5120,0.0307608875963423
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,3072,7168,0.11831643846299912
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,3584,64,0.004880889008442561
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,3072,4096,0.02539644473128849
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,3072,65536,1.1222355100843642
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,3072,3584,0.023401778605249193
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,3072,6144,0.10394755336973403
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,3072,5120,0.08916266759236653
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,3072,3072,0.020735111501481798
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,3072,2560,0.01817244456874
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,3072,2048,0.01566755606068505
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,3072,4096,0.07216178046332465
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,3072,3584,0.06382489204406738
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,3072,1536,0.013184000220563678
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,3072,1024,0.010382222632567087
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,3072,768,0.00867911097076204
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,3072,2560,0.04810577630996704
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,3072,1536,0.032989333073298134
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,3072,512,0.007274666594134436
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,3072,1024,0.02542488939232296
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,3072,256,0.005714666512277391
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,3072,128,0.0052062223354975385
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,3072,768,0.021977777282396953
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,3072,64,0.004716444346639845
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,3072,512,0.018686221705542672
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,3072,256,0.016487111647923786
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,3072,128,0.016135111451148987
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,3072,64,0.015857777661747403
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,3072,32,0.015479111009173922
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,2560,65536,0.28557689984639484
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,3072,51200,0.8793448872036405
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,2560,51200,0.24356532096862793
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,2560,16384,0.08784711360931396
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,2560,12288,0.061851554446750216
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,2560,10240,0.057293335596720375
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,2560,16384,0.26168889469570583
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,2560,12288,0.20747644371456572
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,3072,3072,0.055677334467569985
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,2560,8192,0.042223999897638954
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,3072,2048,0.03975199990802341
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,2560,7168,0.03832533293300205
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,2560,10240,0.17030133141411674
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,2560,6144,0.030604445272021826
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,2560,5120,0.028635554843478735
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,2560,4096,0.022706665926509436
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,2560,8192,0.12759199407365587
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,2560,7168,0.11072178019417657
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,2560,51200,0.8196853531731499
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,2560,6144,0.09625511036978827
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,2560,65536,1.0388249291314018
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,3072,32,0.0047022220161226065
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,2560,5120,0.08199999729792277
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,2560,3072,0.01819022165404426
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,2560,2560,0.015787555111779105
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,2560,2048,0.013510222236315409
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,2560,4096,0.06901422474119398
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,2560,3584,0.05906755394405789
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,2560,3072,0.051273776425255664
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,2560,2560,0.0443520016140408
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,2560,2048,0.036912888288497925
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,2560,1536,0.031088001198238794
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,2560,512,0.006353777729802662
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,2560,256,0.0052168890833854675
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,2560,1024,0.0239964442120658
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,2560,128,0.004565333326657613
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,2560,768,0.020593777298927307
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,2560,512,0.017887110511461895
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,2560,64,0.0041751112374994485
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,2560,256,0.015807999504937064
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,2560,32,0.004243555582231945
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,2560,128,0.015463999576038785
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,2560,64,0.015127110812399121
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,2560,32,0.014837332897716098
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,2048,65536,0.26280800501505536
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,2048,51200,0.19025866190592447
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,2048,16384,0.06752533382839628
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,2560,3584,0.020668443706300523
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,2048,12288,0.0532622238000234
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,2560,1536,0.01128266668981976
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,2560,1024,0.009020444419648912
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,2048,16384,0.24791023466322157
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,2048,10240,0.04211289021703932
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,2560,768,0.0076453329788313965
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,2048,8192,0.034781333472993635
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,2048,7168,0.030823998981051978
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,2048,6144,0.02492622203297085
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,2048,12288,0.1851146618525187
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,2048,51200,0.7863893508911133
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,2048,10240,0.15216710832383898
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,2048,8192,0.11930044492085774
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,2048,5120,0.022282666630215112
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,2048,7168,0.10542222526338364
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,2048,3584,0.016920889417330425
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,2048,4096,0.01867466668287913
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,2048,3072,0.014941333068741692
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,2048,2560,0.013436444103717804
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,2048,6144,0.09142400158776177
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,2048,5120,0.07819910844167073
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,2048,4096,0.06320444742838542
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,2048,2048,0.011696889168686338
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,2048,1536,0.009200000100665623
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,2048,3072,0.048977779017554395
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,2048,1024,0.007595555649863348
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,2048,2560,0.04222755630811056
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,2048,768,0.006613333192136552
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,2048,2048,0.03497066762712266
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,2048,512,0.005798222290145026
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,2048,1536,0.029145777225494385
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,2048,256,0.00488800017370118
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,2048,1024,0.023024888502226934
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,2048,128,0.0041884444653987885
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,2048,768,0.019985778464211356
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,2048,64,0.0038951109680864546
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,2048,32,0.0038488888078265717
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,2048,256,0.015150222513410779
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,2048,128,0.014509333504570855
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,2048,64,0.014449778530332776
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,2048,32,0.014149333039919535
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,1536,65536,0.21386044555240205
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,1536,51200,0.16398310661315918
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,1536,16384,0.057461334599388965
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,1536,12288,0.04718666606479221
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,2048,65536,0.9879208670722114
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,1536,16384,0.2365493244594998
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,1536,10240,0.03689333465364244
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,1536,12288,0.17829155921936035
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,1536,8192,0.029029332929187354
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,1536,7168,0.025813332862324182
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,2048,3584,0.055804444683922656
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,1536,51200,0.7215466499328613
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,1536,10240,0.14511999819013807
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,1536,6144,0.022138666775491502
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,1536,8192,0.11412178145514594
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,1536,5120,0.01907911068863339
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,1536,4096,0.016394666499561734
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,1536,7168,0.09974577691819932
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,1536,3584,0.014942222171359591
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,1536,3072,0.013245333400037555
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,1536,6144,0.08623733123143514
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,1536,5120,0.07322133249706693
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,2048,512,0.017335999343130324
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,1536,4096,0.059115555551317006
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,1536,2048,0.010055999788973067
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,1536,3584,0.052453332477145724
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,1536,1536,0.00867555538813273
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,1536,3072,0.04556711183653938
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,1536,1024,0.0069777775141927935
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,1536,2560,0.03930400146378411
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,1536,768,0.006287999865081575
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,1536,2048,0.03292355603641934
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,1536,512,0.00554044461912579
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,1536,1536,0.027314666244718764
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,1536,256,0.004242666479614046
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,1536,1024,0.02202577723397149
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,1536,128,0.003900444342030419
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,1536,768,0.0188773340649075
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,1536,64,0.0038488888078265717
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,1536,512,0.016529776983790927
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,1536,32,0.0038968887594011095
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,1536,256,0.014340443743599786
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,1536,128,0.01402844488620758
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,1536,64,0.013751111096805997
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,1536,32,0.0138586668504609
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,1024,65536,0.17000888453589547
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,1024,16384,0.0460382236374749
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,1024,51200,0.13881777392493352
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,1024,12288,0.034430222378836736
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,1024,10240,0.028966221544477675
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,1024,8192,0.023834667272037927
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,1024,16384,0.21754754914177787
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,1024,12288,0.16148889064788818
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,1536,65536,0.9216142230563693
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,1024,10240,0.13232710626390246
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,1024,7168,0.02163022259871165
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,1024,6144,0.018791110979186166
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,1024,8192,0.10331200228797065
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,1024,5120,0.01646933290693495
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,1024,4096,0.014143110977278816
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,1536,2560,0.011247110863526663
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,1024,6144,0.07839822106891207
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,1024,51200,0.6566986507839626
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,1024,3584,0.012774222426944308
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,1024,5120,0.06657244761784871
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,1024,3072,0.011393778026103973
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,1024,65536,0.8394968774583605
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,1024,2560,0.010022222167915767
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,1024,4096,0.0536444452073839
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,1024,2048,0.008983111215962304
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,1024,1536,0.007594666547245449
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,1024,1024,0.006226666685607698
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,1024,3072,0.04214488797717624
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,1024,2560,0.035988443427615695
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,1024,2048,0.03035377793841892
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,1024,768,0.005564444594913059
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,1024,1536,0.02530755599339803
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,1024,512,0.004585777719815572
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,1024,256,0.0041786668201287585
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,1024,1024,0.020246222615242004
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,1024,768,0.017628444565667045
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,1024,256,0.013776000175211163
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,1024,128,0.013122667041089801
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,1024,32,0.0035537779331207275
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,1024,64,0.01308444473478529
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,1024,32,0.012778666284349231
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,768,65536,0.12909066677093506
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,768,51200,0.09981155395507812
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,1024,7168,0.09071466657850479
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,768,16384,0.034501334031422935
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,1024,3584,0.04700444473160637
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,768,12288,0.025158221522967022
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,768,16384,0.21461333168877494
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,1024,128,0.003588444242874781
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,768,10240,0.02164799968401591
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,768,65536,0.831042660607232
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,768,8192,0.018012444178263348
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,768,51200,0.6506889131334093
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,1024,64,0.003522666792074839
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,768,7168,0.016770665844281513
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,768,6144,0.014799111419253878
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,768,5120,0.013087111214796701
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,768,10240,0.13107111718919542
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,768,8192,0.10249688890245225
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,768,7168,0.08965155813429092
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,768,4096,0.010843555960390302
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,768,6144,0.07782044675615099
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,768,3584,0.01035644445154402
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,768,3072,0.009357333183288574
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,768,2560,0.008329778081840938
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,768,4096,0.053299556175867714
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,768,3584,0.04663822385999891
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,768,3072,0.04150044586923387
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,768,2048,0.007424888511498769
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,768,1536,0.00627377794848548
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,768,2560,0.03462666604253981
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,768,1024,0.00527022240890397
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,768,768,0.00489066665371259
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,768,2048,0.029494222667482164
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,768,1536,0.025053333905008104
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,768,512,0.004190222256713443
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,768,1024,0.020000888241661918
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,768,256,0.003855111284388436
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,768,768,0.017589333984586928
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,768,128,0.003859555555714501
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,768,512,0.015459555718633862
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,768,64,0.003176888864901331
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,768,32,0.003572444534964032
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,768,256,0.013391999734772576
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,768,128,0.01311555587583118
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,768,64,0.01274222218328052
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,512,65536,0.10202222400241429
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,768,32,0.012404444317022959
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,1024,512,0.01587022178702884
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,512,51200,0.0790426664882236
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,768,12288,0.16052977244059244
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,512,12288,0.027328888575236004
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,512,10240,0.02331111166212294
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,512,16384,0.2053511142730713
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,512,12288,0.1534764501783583
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,768,5120,0.06600711080763075
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,512,8192,0.019831111033757527
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,512,10240,0.1256728834576077
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,512,7168,0.017456889152526855
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,512,6144,0.012263110942310758
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,512,5120,0.010269333091047075
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,512,51200,0.6185519960191515
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,512,8192,0.09708444277445476
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,512,7168,0.08558489216698541
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,512,3584,0.008751110898123847
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,512,6144,0.07437866926193237
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,512,5120,0.06275733311971028
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,512,3072,0.00776533368561003
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,512,4096,0.04970844586690267
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,512,2560,0.007244444555706448
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,512,3584,0.043904887305365674
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,512,3072,0.038105779223971896
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,512,2048,0.006974221931563483
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,512,1536,0.005572444448868434
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,512,2560,0.033324443631702
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,512,1024,0.004639111045334074
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,512,768,0.004171555654870139
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,512,2048,0.02866577770974901
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,512,16384,0.0321742229991489
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,512,1536,0.024156444602542456
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,512,512,0.0038515557017591265
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,512,1024,0.01955111159218682
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,512,256,0.0035048888789282907
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,512,128,0.003149333306484752
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,512,768,0.016840888394249808
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,512,64,0.00313688897424274
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,512,32,0.00314666661951277
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,512,512,0.015009777413474189
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,512,256,0.013191111385822296
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,512,128,0.012744888663291931
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,256,65536,0.051683555046717324
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,512,64,0.012434666355450949
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,256,51200,0.0412124428484175
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,512,32,0.012095111111799875
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,256,16384,0.018000000052981906
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,256,12288,0.014988443917698331
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,256,10240,0.014113777213626437
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,256,16384,0.19568799601660836
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,512,4096,0.009358222285906473
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,256,12288,0.14533244238959417
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,256,8192,0.01346933344999949
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,256,7168,0.012079999678664737
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,256,6144,0.010383110907342698
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,256,8192,0.09179466962814331
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,256,51200,0.5867022408379449
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,256,7168,0.08062489165200128
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,256,6144,0.06970755259195964
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,256,5120,0.05884177817238701
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,256,4096,0.047356443272696606
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,256,3584,0.007281777759393056
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,256,3072,0.006636444479227066
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,256,3584,0.04199377695719401
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,256,3072,0.036312000619040594
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,256,2560,0.006090666684839461
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,256,2048,0.00554666668176651
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,256,2560,0.03152799937460158
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,256,2048,0.027419555518362258
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,256,1536,0.004874666531880696
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,256,1024,0.004328888737493091
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,512,65536,0.7886897722880045
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,256,768,0.003882666842805015
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,256,10240,0.11859999762641059
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,256,1024,0.018545778261290658
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,256,512,0.003543111185232798
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,256,256,0.003495111233658261
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,256,768,0.01676977839734819
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,256,5120,0.00924355536699295
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,256,128,0.0031840000301599503
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,256,512,0.014440889159838358
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,256,65536,0.7484301990932889
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,256,256,0.01237422227859497
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,256,32,0.0028657778683635923
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,256,128,0.01203555530971951
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,128,65536,0.04256622327698601
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,256,32,0.011743110915025076
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,128,51200,0.035226666265063815
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,128,16384,0.011718221836619906
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,128,16384,0.19469243950313994
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,128,12288,0.010354667074150508
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,128,51200,0.5858133104112413
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,128,10240,0.011858666936556498
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,256,1536,0.02314222190115187
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,128,65536,0.7459751235114204
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,128,8192,0.010606221854686737
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,128,7168,0.010054222411579555
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,128,10240,0.11786577436659072
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,128,8192,0.09134311146206325
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,256,4096,0.008055110772450766
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,128,6144,0.009879111415810054
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,128,5120,0.009323555562231276
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,128,4096,0.007624000310897827
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,128,7168,0.08011111285951403
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,128,3584,0.007285333342022366
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,256,64,0.011768889096048145
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,128,3072,0.00655644428398874
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,128,6144,0.06903111272388034
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,128,2560,0.005912000106440649
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,128,5120,0.058373332023620605
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,128,4096,0.04621422290802002
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,128,2048,0.005244444641802046
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,128,3584,0.04110577702522278
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,128,1536,0.004566222015354368
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,128,3072,0.035663998789257474
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,128,1024,0.004087111188305749
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,128,2560,0.03181511163711548
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,128,768,0.003859555555714501
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,128,512,0.003212444484233856
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,128,1536,0.022837332553333704
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,128,256,0.0033679999825027254
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,128,1024,0.018559111489189994
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,128,768,0.016359110673268635
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,128,128,0.0029848888516426086
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,128,512,0.01443555619981554
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,128,64,0.0028693332440323303
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,128,32,0.002875555513633622
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,128,256,0.012409778104888068
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,128,128,0.012101333174440594
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,128,64,0.011740444435013665
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,64,65536,0.038988444540235735
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,128,32,0.011372444530328115
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,64,51200,0.031025777260462444
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,64,16384,0.011585777832402123
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,128,12288,0.14493955506218806
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,64,12288,0.010680889089902243
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,64,10240,0.009694221946928237
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,64,16384,0.19481155607435438
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,256,64,0.0028488888508743713
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,64,12288,0.14462221993340388
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,64,10240,0.11826044983334011
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,64,7168,0.009319110876984065
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,64,6144,0.008678221868144141
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,64,51200,0.5859831174214681
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,64,8192,0.09129510985480414
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,64,5120,0.008292444050312042
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,64,65536,0.7458782196044922
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,64,7168,0.07978489001592
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,64,4096,0.007656888829337225
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,64,6144,0.06906577613618639
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,64,3584,0.006928000185224745
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,64,3072,0.006588444527652528
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,128,2048,0.02715822226471371
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,64,2560,0.005886222339338726
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,64,5120,0.05815022521548801
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,64,2048,0.005261333452330695
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,64,3584,0.04061155517896017
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,64,3072,0.035368889570236206
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,64,1024,0.003858666867017746
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,64,2560,0.03153333399030898
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,64,2048,0.027132444911532935
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,64,768,0.003519111209445529
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,64,1536,0.023043556345833674
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,64,512,0.0032151111712058387
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,64,1024,0.01854222185081906
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,64,768,0.016520000166363187
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,64,128,0.0028906667398081887
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,64,512,0.014482667048772177
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,64,64,0.0028719999310043124
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,64,256,0.012400888734393649
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,64,32,0.002550222186578645
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,64,128,0.012094222009181976
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,64,64,0.011720000041855706
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,32,65536,0.04061866799990336
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,64,32,0.011538666983445486
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,64,8192,0.008984888593355814
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,32,51200,0.03108355402946472
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,32,16384,0.010386666489972008
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,32,12288,0.013085333009560903
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,32,16384,0.19455022282070586
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,32,10240,0.011388444238238864
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,32,8192,0.0107022225856781
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,64,4096,0.04660800099372864
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,64,1536,0.004567111117972268
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,32,7168,0.00997866690158844
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,32,51200,0.5852533446417915
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,32,10240,0.11784266100989448
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,32,65536,0.74599912431505
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,32,8192,0.09093244208229913
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,32,5120,0.012422222230169507
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,32,4096,0.008952889177534316
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,32,7168,0.07991377512613933
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,64,256,0.003177777760558658
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,32,3584,0.008279110822412703
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,32,3072,0.007283555964628856
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,32,6144,0.06936888562308417
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,32,2560,0.0063546668324205614
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,32,5120,0.057836446497175426
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,32,2048,0.00556355549229516
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,32,1536,0.004527111020353106
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,32,3584,0.040752000278896756
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,32,3072,0.03556888964441087
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,32,1024,0.004015999949640698
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,32,2560,0.03137866655985514
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,32,768,0.003543111185232798
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,32,2048,0.027116444375779893
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,32,512,0.0035182221068276297
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,32,1536,0.0229795558585061
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,32,256,0.0031840000301599503
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,32,1024,0.018585777944988675
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,32,128,0.0028213332924577924
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,32,768,0.016169778174824186
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,32,64,0.0028862222615215513
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,32,512,0.014440000057220459
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,32,32,0.002526222210791376
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,32,256,0.012725333372751871
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,32,128,0.011745777395036487
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,32,64,0.011427555647161273
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,32,32,0.011536888778209686
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,32,12288,0.1447111103269789
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1537,32,6144,0.014095111025704278
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1537,32,4096,0.0464933349026574
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,65536,16384,1.9564613766140406
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,65536,12288,1.4298942353990343
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,65536,16384,2.2820445166693792
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,65536,10240,1.1933928595648873
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,65536,12288,1.6470204459296331
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,65536,16384,2.0547608269585504
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,65536,8192,0.995290650261773
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,65536,12288,1.4867564307318792
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,65536,10240,1.3568888770209417
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,65536,8192,1.0732648637559679
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,65536,51200,6.262232886420356
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,65536,7168,0.800813357035319
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,65536,10240,1.2340097427368164
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,65536,7168,0.9017706976996528
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,65536,6144,0.6890426741706001
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,65536,5120,0.5378924475775825
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,65536,6144,0.8301084306504992
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,65536,7168,0.8479706446329752
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,65536,8192,0.9805929395887586
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,65536,4096,0.4191111193762885
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,65536,5120,0.6597768995496962
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,65536,6144,0.7117039892408582
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,65536,4096,0.5571902063157823
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,65536,51200,8.285068935818142
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,65536,5120,0.6076569027370876
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,65536,3072,0.3181511031256782
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,65536,4096,0.4939395586649577
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,65536,3584,0.4498000144958496
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,65536,3072,0.40174044503106016
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,65536,2560,0.26825155152214897
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,65536,2048,0.2135902245839437
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,65536,2560,0.343798213534885
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,65536,3584,0.43395111295912003
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,65536,3072,0.38477688365512425
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,65536,1536,0.1653884384367201
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,65536,2048,0.29476088947719997
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,65536,2560,0.32344532012939453
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,65536,1024,0.12007644441392686
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,65536,3584,0.3701911237504747
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,65536,1536,0.21994045045640734
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,65536,768,0.10095644659466213
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,65536,1536,0.21756800015767416
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,65536,2048,0.2822897699144152
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,65536,512,0.0714248882399665
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,65536,768,0.1334773302078247
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,65536,256,0.05420622229576111
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,65536,1024,0.1721351146697998
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,65536,768,0.14198844962649876
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,65536,128,0.04514844550026787
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,65536,512,0.11651644441816543
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,65536,256,0.10084088643391927
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,65536,64,0.039410667286978826
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,65536,256,0.1024986637963189
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,65536,128,0.07711199919382732
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,65536,32,0.03972355524698893
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,65536,64,0.09890933169258966
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,65536,32,0.09698310825559829
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,65536,1024,0.16956888304816353
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,65536,512,0.11488710509406196
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,65536,128,0.09813511371612549
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,65536,51200,6.634367201063369
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,51200,16384,1.5140995449490016
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,51200,16384,1.8419812520345051
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,51200,51200,4.924769931369357
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,51200,12288,1.157865736219618
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,51200,16384,1.6512035793728297
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,51200,65536,6.462441762288411
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,51200,12288,1.2955955929226346
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,51200,10240,0.9082479476928711
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,51200,51200,6.555641598171658
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,51200,8192,0.6995137532552084
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,51200,12288,1.144953727722168
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,51200,10240,1.0631511476304796
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,51200,8192,0.846095985836453
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,51200,7168,0.616187572479248
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,51200,65536,8.763920254177517
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,51200,10240,1.0025901794433594
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,51200,7168,0.7185520066155328
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,51200,6144,0.5477937592400445
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,51200,5120,0.4169457753499349
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,51200,8192,0.7898080084058973
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,51200,6144,0.6290808783637153
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,51200,7168,0.6770124435424805
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,51200,5120,0.5480168660481771
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,51200,6144,0.5826960139804417
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,51200,4096,0.36519289016723633
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,51200,5120,0.4955600102742513
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,51200,3584,0.2902231216430664
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,51200,4096,0.41214844915601945
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,51200,3584,0.3720613320668538
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,51200,3072,0.25131199094984263
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,51200,4096,0.4060702323913574
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,51200,3072,0.3346106741163466
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,51200,2560,0.2564764552646213
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,51200,3584,0.357605324851142
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,51200,51200,5.381527794731988
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,51200,3072,0.3094160026974148
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,51200,2048,0.1701564391454061
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,51200,1536,0.15725689464145237
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,51200,2048,0.23684800995720756
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,51200,1024,0.09435555669996475
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,51200,1536,0.17564800050523546
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,51200,2560,0.2819911109076606
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,51200,768,0.08010044362809923
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,51200,1024,0.13618132803175184
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,51200,768,0.11106577846739028
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,51200,1536,0.20325777265760633
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,51200,768,0.117411560482449
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,51200,512,0.0562631090482076
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,51200,256,0.041454222467210554
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,51200,512,0.09682310952080621
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,51200,512,0.09789155589209662
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,51200,128,0.035184890031814575
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,51200,2560,0.2795440091027154
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,51200,256,0.07920977804395887
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,51200,256,0.0835297769970364
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,51200,64,0.03145155641767714
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,51200,128,0.07948355542288886
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,51200,128,0.0642568866411845
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,51200,32,0.03161244591077169
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,51200,65536,6.817266676161025
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,51200,2048,0.2248986562093099
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,51200,32,0.07943644126256307
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,51200,1024,0.1393244398964776
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,51200,64,0.0784097777472602
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,16384,51200,1.4908515082465277
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,16384,65536,1.9739856719970703
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,16384,16384,0.45739465289645725
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,16384,12288,0.3677982224358453
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,16384,16384,0.6840524673461914
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,16384,51200,2.274615181816949
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,16384,10240,0.2889937824673123
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,16384,65536,2.9037191602918835
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,16384,12288,0.5033022032843696
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,16384,10240,0.40517510308159727
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,16384,16384,0.6836542023552789
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,16384,8192,0.32400443818834096
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,16384,12288,0.5106470849778917
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,16384,7168,0.19696266121334502
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,16384,8192,0.3413795630137126
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,16384,6144,0.16950666904449463
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,16384,10240,0.43608800570170086
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,16384,7168,0.28086309962802464
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,16384,5120,0.14937955803341335
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,16384,7168,0.3007395532396105
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,16384,6144,0.241829342312283
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,16384,51200,2.17684449089898
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,16384,5120,0.20315555731455484
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,16384,6144,0.2691528797149658
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,16384,4096,0.12014488379160564
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,16384,3584,0.11582756042480469
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,16384,4096,0.16530044873555502
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,16384,8192,0.2559555636511909
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,16384,3072,0.09346399704615276
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,16384,2560,0.08146755562888251
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,16384,3584,0.14690221680535212
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,16384,4096,0.1881048944261339
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,16384,5120,0.2224595546722412
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,16384,3584,0.1654133399327596
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,16384,3072,0.1279884444342719
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,16384,1536,0.04734577735265096
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,16384,3072,0.14719377623664007
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,16384,65536,2.8030870225694446
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,16384,2560,0.11111999882592095
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,16384,2048,0.10873511102464463
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,16384,2048,0.09319821993509929
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,16384,2560,0.12742400169372559
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,16384,1024,0.03501244386037191
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,16384,1536,0.08963733249240452
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,16384,1536,0.07413155502743192
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,16384,768,0.02644355595111847
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,16384,512,0.01978933314482371
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,16384,1024,0.05702400207519531
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,16384,256,0.01614755557643043
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,16384,1024,0.07169510920842488
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,16384,768,0.06378577815161811
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,16384,768,0.04619110955132378
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,16384,128,0.01791466606987847
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,16384,512,0.05288799934917026
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,16384,64,0.015140444040298462
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,16384,256,0.04389066828621758
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,16384,32,0.015584000282817416
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,16384,256,0.033075554503334895
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,16384,128,0.03558133376969232
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,16384,64,0.03213511241806878
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,16384,32,0.03119822343190511
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,16384,2048,0.06929155853059557
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,12288,51200,0.9654311074150933
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,16384,512,0.03824533356560601
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,12288,65536,1.3442790773179796
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,16384,128,0.033278223541047834
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,12288,16384,0.3532124360402425
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,12288,12288,0.26502754953172475
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,12288,16384,0.5483022265964085
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,12288,10240,0.22827911376953125
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,12288,51200,1.8064320882161458
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,12288,16384,0.5834124353196886
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,12288,65536,2.3734728495279946
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,12288,12288,0.43555466334025067
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,12288,10240,0.33708622720506454
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,12288,8192,0.15961599349975586
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,12288,10240,0.3574133449130588
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,12288,7168,0.14435466130574545
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,12288,8192,0.2883111106024848
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,12288,7168,0.2277831236521403
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,12288,6144,0.14258844322628444
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,12288,7168,0.2605280081431071
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,12288,12288,0.4198284414079454
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,12288,6144,0.19616356160905626
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,12288,5120,0.10352533393436009
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,12288,4096,0.08345155583487616
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,12288,6144,0.22690312067667642
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,12288,5120,0.1661635504828559
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,12288,3584,0.07134222322040133
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,12288,5120,0.18925066788991293
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,12288,4096,0.13650755087534586
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,12288,4096,0.15812622176276311
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,12288,3072,0.06811377737257215
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,12288,3584,0.12099644872877334
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,12288,3584,0.14140444331698948
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,12288,8192,0.2622097863091363
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,12288,2560,0.051579554875691734
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,12288,3072,0.1066888901922438
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,12288,2048,0.04338666796684265
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,12288,3072,0.12542043791876897
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,12288,2560,0.1095199982325236
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,12288,2560,0.09283555878533258
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,12288,1536,0.03728711273935106
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,12288,2048,0.07748177978727552
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,12288,1024,0.024654222859276667
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,12288,2048,0.09370933638678657
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,12288,768,0.021359999974568684
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,12288,1536,0.061347557438744434
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,12288,1536,0.07766489187876384
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,12288,1024,0.04675555560323927
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,12288,512,0.015882665912310284
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,12288,1024,0.06249155600865682
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,12288,768,0.0536373323864407
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,12288,768,0.03860177927547031
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,12288,256,0.01237777786122428
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,12288,512,0.04612444506751167
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,12288,512,0.03196355700492859
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,12288,128,0.011034666664070554
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,12288,65536,2.3104657067192926
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,12288,256,0.03763644562827216
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,12288,256,0.027639999985694885
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,12288,32,0.009657777845859528
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,12288,128,0.031175110075208876
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,12288,128,0.027120888233184814
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,12288,64,0.026718222432666357
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,12288,32,0.026184888349639043
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,12288,51200,1.8096603817409938
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,12288,64,0.009719111025333405
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,10240,65536,1.2040106455485027
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,10240,51200,1.0529893239339192
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,10240,16384,0.2924133406745063
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,10240,12288,0.2316124439239502
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,10240,16384,0.5213653246561686
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,10240,12288,0.3625653319888645
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,10240,10240,0.19278132915496826
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,10240,16384,0.5491724544101292
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,10240,65536,2.1242088741726346
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,10240,12288,0.4037288824717204
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,10240,10240,0.29506222407023114
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,10240,8192,0.17417332861158583
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,10240,8192,0.23492889934115938
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,10240,7168,0.13464266724056667
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,10240,10240,0.3338889016045465
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,10240,7168,0.20338932673136392
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,10240,8192,0.2687315675947401
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,10240,7168,0.24034667015075684
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,10240,5120,0.11070311069488525
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,10240,6144,0.174145778020223
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,10240,6144,0.20708621872795951
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,10240,4096,0.08659199873606364
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,10240,51200,1.6787804497612848
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,10240,5120,0.1476773288514879
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,10240,3584,0.07806489202711317
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,10240,5120,0.17956088648902047
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,10240,65536,2.1190257602267795
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,10240,4096,0.1220746702618069
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,10240,3072,0.06745866934458415
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,10240,4096,0.14670133590698242
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,10240,2560,0.05730399820539686
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,10240,3584,0.10811289151509602
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,10240,3584,0.1329208877351549
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,10240,3072,0.09778666496276855
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,10240,2560,0.08313244581222534
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,10240,2560,0.10302755567762588
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,10240,51200,1.6796613269382055
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,10240,1536,0.03433155682351854
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,10240,2048,0.06874844763014051
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,10240,1024,0.025340444511837427
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,10240,2048,0.09122666385438706
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,10240,768,0.02219555609756046
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,10240,1536,0.05430044399367439
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,10240,1536,0.07613333066304524
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,10240,1024,0.04209066761864556
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,10240,1024,0.059170663356781006
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,10240,512,0.01908888916174571
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,10240,768,0.035438223017586604
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,10240,768,0.05081955591837565
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,10240,256,0.014700444208251106
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,10240,512,0.045316444502936475
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,10240,512,0.02881511052449544
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,10240,128,0.01000088867213991
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,10240,256,0.035734222994910345
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,10240,64,0.01178311142656538
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,10240,128,0.03286755416128371
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,10240,32,0.012088889049159156
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,10240,64,0.02437244521247016
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,10240,32,0.02382044494152069
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,10240,3072,0.11818844742245144
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,10240,6144,0.1144568920135498
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,8192,65536,0.8752657572428385
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,10240,256,0.025407999753952026
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,10240,128,0.024332443873087566
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,8192,16384,0.23401154412163627
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,8192,51200,0.6850453482733833
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,10240,2048,0.044222222434149853
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,8192,12288,0.16846666071150038
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,8192,16384,0.4175111187828912
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,8192,65536,1.7724115583631728
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,8192,10240,0.15140710936652288
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,8192,16384,0.5054355727301704
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,8192,51200,1.4008053673638239
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,8192,12288,0.3733537726932102
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,8192,10240,0.2557315561506483
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,8192,8192,0.1330933305952284
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,8192,10240,0.31002312236362034
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,8192,7168,0.11713955137464736
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,8192,8192,0.20066222879621717
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,8192,8192,0.24830044640435112
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,8192,7168,0.17758133676317003
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,8192,65536,1.9269741906060114
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,8192,7168,0.22661511103312174
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,8192,5120,0.08711110883288914
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,8192,51200,1.5112924575805664
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,8192,4096,0.07172889179653592
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,8192,6144,0.19228088855743408
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,8192,5120,0.1308106713824802
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,8192,12288,0.3100515471564399
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,8192,3584,0.053103112512164645
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,8192,5120,0.16756888230641684
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,8192,3072,0.04602933261129591
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,8192,4096,0.10635022322336833
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,8192,4096,0.13640799787309435
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,8192,2560,0.04235377907752991
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,8192,3584,0.09672711292902629
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,8192,3584,0.12320889366997613
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,8192,2048,0.034167998366885714
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,8192,3072,0.08502311176723903
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,8192,1536,0.026361778378486633
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,8192,2560,0.09552177455690171
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,8192,2560,0.07300621933407254
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,8192,2048,0.060211552513970264
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,8192,1024,0.01940799918439653
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,8192,1536,0.0484479996893141
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,8192,1536,0.06823111242718168
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,8192,768,0.016011555989583332
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,8192,1024,0.05567555295096504
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,8192,1024,0.037760890192455716
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,8192,512,0.012060444388124677
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,8192,6144,0.10001689195632935
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,8192,256,0.011757333245542316
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,8192,768,0.030883553955290053
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,8192,512,0.025565332836574976
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,8192,512,0.040757334894604154
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,8192,128,0.01036533299419615
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,8192,256,0.022636445032225713
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,8192,6144,0.15284621715545654
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,8192,64,0.009644444617960189
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,8192,32,0.009644444617960189
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,8192,128,0.02955377764172024
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,8192,64,0.02166044380929735
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,8192,32,0.021571555071406897
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,8192,3072,0.10964444610807632
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,8192,2048,0.08267822530534533
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,7168,65536,0.8652604420979818
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,8192,768,0.047563556167814464
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,8192,256,0.034103999535242714
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,7168,51200,0.6752844386630588
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,8192,128,0.02197955548763275
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,7168,16384,0.24346399307250977
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,7168,12288,0.18520355224609375
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,7168,16384,0.3882586691114638
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,7168,12288,0.2887626753913032
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,7168,65536,1.6315075556437175
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,7168,10240,0.14982488420274523
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,7168,51200,1.266056908501519
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,7168,8192,0.11942933665381537
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,7168,10240,0.2377502123514811
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,7168,16384,0.463314692179362
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,7168,12288,0.34775911437140566
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,7168,7168,0.10927377806769477
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,7168,6144,0.09334933095508152
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,7168,8192,0.18716888957553438
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,7168,10240,0.2914915614657932
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,7168,7168,0.16547021600935194
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,7168,8192,0.23244267039828828
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,7168,7168,0.20494666364457872
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,7168,5120,0.07710666788948907
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,7168,4096,0.06275377670923869
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,7168,6144,0.14223821957906088
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,7168,6144,0.17918044990963408
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,7168,5120,0.1213644478056166
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,7168,3584,0.056277334690093994
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,7168,65536,1.7807759179009333
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,7168,4096,0.12775288687811956
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,7168,3584,0.08928533395131429
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,7168,3584,0.11490755610995823
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,7168,51200,1.3983511394924586
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,7168,2560,0.04129244552718268
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,7168,3072,0.10388266377978855
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,7168,2048,0.03397599856058756
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,7168,2560,0.08986044592327541
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,7168,2048,0.0562666654586792
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,7168,2048,0.07766577932569715
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,7168,1536,0.02663999961482154
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,7168,1536,0.04523200127813551
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,7168,1536,0.06400177876154582
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,7168,1024,0.020428443948427837
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,7168,1024,0.03511910968356662
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,7168,5120,0.15335378381941053
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,7168,1024,0.05239822136031257
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,7168,768,0.016597333881590102
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,7168,512,0.011754666765530905
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,7168,4096,0.09935288959079319
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,7168,768,0.04522844486766391
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,7168,768,0.02915289004643758
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,7168,3072,0.04788177874353197
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,7168,256,0.00904977818330129
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,7168,512,0.02404266595840454
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,7168,512,0.03944355580541823
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,7168,128,0.008302222523424361
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,7168,64,0.0069546666410234236
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,7168,256,0.03254400028122796
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,7168,256,0.021299555897712708
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,7168,128,0.029355555772781372
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,7168,32,0.009365333451165093
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,7168,128,0.02058844433890449
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,7168,64,0.02065333392884996
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,7168,2560,0.0680017802450392
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,7168,32,0.020353777541054618
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,6144,51200,0.48979642656114364
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,6144,65536,0.5920222070482042
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,6144,16384,0.17950667275322807
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,6144,16384,0.38047289848327637
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,7168,3072,0.07955733272764418
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,6144,12288,0.11877866586049397
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,6144,51200,1.1770168940226238
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,6144,12288,0.26628979047139484
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,6144,65536,1.4865164226955836
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,6144,12288,0.3253520064883762
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,6144,10240,0.21846755345662436
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,6144,8192,0.09867378075917561
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,6144,51200,1.2879698011610243
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,6144,10240,0.2675440046522352
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,6144,7168,0.07978666490978666
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,6144,6144,0.07072177860471937
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,6144,8192,0.17310667037963867
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,6144,8192,0.21396444903479683
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,6144,7168,0.1522266732321845
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,6144,5120,0.06130933099322849
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,6144,7168,0.19029422601064047
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,6144,65536,1.644360860188802
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,6144,6144,0.13140088982052273
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,6144,4096,0.04895822207132975
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,6144,6144,0.16560178332858616
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,6144,3584,0.04372266597217984
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,6144,5120,0.1120248900519477
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,6144,5120,0.14208622773488364
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,6144,4096,0.09222844574186538
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,6144,3072,0.03897422220971849
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,6144,4096,0.11890844504038493
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,6144,2560,0.0324906673696306
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,6144,3584,0.10746488968531291
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,6144,10240,0.11263999674055312
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,6144,2048,0.024703999360402424
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,6144,16384,0.4410097863939073
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,6144,3072,0.09542400307125515
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,6144,2560,0.06224977970123291
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,6144,2560,0.08283022377226087
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,6144,1024,0.015038222074508667
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,6144,2048,0.07221244441138373
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,6144,1536,0.041344000233544245
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,6144,1536,0.059989333152770996
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,6144,768,0.012774222426944308
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,6144,1024,0.03279022375742594
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,6144,1024,0.049550222025977246
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,6144,512,0.009349333743254343
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,6144,768,0.04126755396525065
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,6144,768,0.027349332968393963
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,6144,256,0.0074337778819931885
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,6144,512,0.022686221533351477
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,6144,512,0.03543377916018168
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,6144,128,0.006928000185224745
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,6144,256,0.019896888070636325
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,6144,128,0.019544000426928203
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,6144,64,0.006217777729034424
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,6144,64,0.019270223047998216
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,6144,32,0.0064560001095136
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,6144,3584,0.08155555857552423
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,6144,3072,0.07050666544172499
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,6144,32,0.01921244462331136
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,6144,1536,0.020255110330051847
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,6144,2048,0.05198311143451267
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,5120,65536,0.5396657519870335
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,5120,51200,0.45429420471191406
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,6144,256,0.03200088938077291
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,5120,16384,0.16354578071170384
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,6144,128,0.027705777022573683
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,5120,12288,0.1224551068411933
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,5120,16384,0.32905954784817165
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,5120,12288,0.24518489837646484
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,5120,51200,1.0714604059855144
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,5120,65536,1.3702551523844402
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,5120,16384,0.4371155632866754
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,5120,10240,0.10748444663153754
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,5120,8192,0.08685155709584554
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,5120,12288,0.31991733445061576
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,5120,10240,0.20142222775353325
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,5120,7168,0.07726222276687622
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,5120,8192,0.15768088234795466
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,5120,10240,0.26361510488722056
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,5120,6144,0.0634933312733968
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,5120,7168,0.13894311587015787
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,5120,7168,0.1882702244652642
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,5120,5120,0.05212444398138258
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,5120,6144,0.12131644619835748
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,5120,4096,0.04323644439379374
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,5120,6144,0.16444178422292074
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,5120,65536,1.624946700202094
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,5120,5120,0.1028675569428338
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,5120,5120,0.14011111524369982
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,5120,51200,1.2725768619113498
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,5120,3072,0.03460622164938185
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,5120,4096,0.11760355366600884
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,5120,2560,0.029785778787400987
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,5120,3584,0.10589066478941177
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,5120,3584,0.07419911358091566
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,5120,3072,0.09420622057384914
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,5120,3072,0.06632355848948161
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,5120,2048,0.02481866710715824
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,5120,1536,0.019761777586407132
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,5120,2560,0.055504000849194
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,5120,2560,0.08205155531565349
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,5120,1024,0.0155395550860299
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,5120,2048,0.07147555881076388
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,5120,1536,0.05919288926654392
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,5120,768,0.012835555606418185
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,5120,1024,0.03051111102104187
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,5120,768,0.025075554847717285
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,5120,768,0.041913777589797974
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,5120,512,0.00941955546538035
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,5120,512,0.03479111194610596
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,5120,256,0.00758844448460473
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,5120,3584,0.03927822245491876
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,5120,256,0.0188719994492001
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,5120,4096,0.08460978004667495
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,5120,128,0.006623999940024481
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,5120,256,0.030525333351559106
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,5120,64,0.006631111105283101
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,5120,128,0.027169777287377253
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,5120,128,0.018227555685573153
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,5120,32,0.006586666736337874
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,5120,64,0.017906667457686532
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,5120,32,0.017723555366198223
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,5120,2048,0.04763111140992907
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,5120,1536,0.03838488790724013
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,5120,1024,0.04713866776890225
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,4096,65536,0.4941600163777669
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,5120,8192,0.2142417828241984
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,4096,51200,0.4094231128692627
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,4096,16384,0.13433599472045898
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,5120,512,0.021363554729355708
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,4096,12288,0.10256799724366929
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,4096,16384,0.3004693455166287
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,4096,12288,0.22228977415296766
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,4096,10240,0.0927199986245897
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,4096,16384,0.40300710995992023
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,4096,51200,0.9588676028781467
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,4096,8192,0.07571911149554782
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,4096,65536,1.2215795516967773
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,4096,10240,0.1850737730662028
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,4096,10240,0.24117689662509492
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,4096,7168,0.06336889002058241
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,4096,6144,0.05093155635727776
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,4096,8192,0.19600533114539254
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,4096,7168,0.1281928883658515
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,4096,7168,0.17272978358798555
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,4096,6144,0.11107466618220012
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,4096,5120,0.04220799936188591
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,4096,6144,0.15183022287156847
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,4096,4096,0.03481866584883796
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,4096,51200,1.1631288528442383
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,4096,3584,0.03263288736343384
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,4096,5120,0.09538933303621079
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,4096,5120,0.1293048858642578
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,4096,65536,1.4844951629638672
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,4096,4096,0.10747733381059434
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,4096,3072,0.028016000986099243
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,4096,3584,0.07006488906012641
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,4096,2560,0.02437244521247016
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,4096,3072,0.08711466524336074
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,4096,3072,0.06153511338763767
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,4096,2048,0.020541333489947848
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,4096,2560,0.07589599821302626
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,4096,2560,0.05123910970158047
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,4096,12288,0.30869245529174805
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,4096,1536,0.014294221997261047
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,4096,2048,0.06612533330917358
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,4096,2048,0.04344800114631653
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,4096,1024,0.012095111111799875
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,4096,1536,0.05583110782835218
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,4096,1536,0.035655998521380954
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,4096,768,0.009640889035330879
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,4096,1024,0.043623109658559166
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,4096,1024,0.027101332942644756
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,4096,512,0.00794577764140235
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,4096,768,0.02315644423166911
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,4096,256,0.0069306666652361555
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,4096,512,0.03334133492575751
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,4096,512,0.019892444213231403
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,4096,128,0.005927111125654644
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,4096,256,0.017271111408869427
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,4096,256,0.029576000240114
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,4096,64,0.006934222247865465
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,4096,128,0.02643644478585985
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,4096,128,0.017161778277821012
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,4096,32,0.00720088928937912
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,4096,3584,0.09765599833594428
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,4096,64,0.01681777834892273
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,4096,32,0.01647822227742937
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,3584,65536,0.4464755588107639
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,4096,8192,0.14549867312113443
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,4096,768,0.038763556215498186
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,3584,16384,0.12290933397081162
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,4096,4096,0.079148444864485
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,3584,65536,1.1701022254096138
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,3584,16384,0.28773511780632866
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,3584,12288,0.09075822432835896
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,3584,51200,0.9173644383748373
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,3584,10240,0.0834382242626614
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,3584,12288,0.215009782049391
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,3584,16384,0.386957327524821
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,3584,8192,0.06805244419309828
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,3584,51200,0.3399866686926947
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,3584,12288,0.2908053398132324
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,3584,10240,0.176200893190172
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,3584,65536,1.4748409059312608
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,3584,7168,0.058506667613983154
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,3584,10240,0.24029511875576445
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,3584,6144,0.05116888880729675
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,3584,8192,0.1383555597729153
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,3584,51200,1.1584053039550781
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,3584,8192,0.1928622192806668
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,3584,7168,0.12213510937160915
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,3584,4096,0.03337422344419692
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,3584,6144,0.10719377464718288
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,3584,6144,0.1499511135949029
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,3584,5120,0.09110044770770603
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,3584,3584,0.03072711163096958
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,3584,4096,0.07509599791632758
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,3584,4096,0.10716799894968669
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,3584,3072,0.026701332794295415
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,3584,3584,0.0968995557890998
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,3584,3584,0.06745600038104586
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,3584,2560,0.02316711180739933
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,3584,2048,0.01980266637272305
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,3584,3072,0.0579377810160319
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,3584,2560,0.04907377892070346
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,3584,2560,0.07562577724456787
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,3584,1536,0.01588622232278188
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,3584,2048,0.06595466534296672
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,3584,2048,0.04148177636994256
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,3584,1024,0.011744000017642975
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,3584,1536,0.03413866625891791
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,3584,1536,0.05533688929345873
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,3584,768,0.009081777599122789
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,3584,1024,0.026294221480687458
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,3584,512,0.007270221908887227
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,3584,768,0.022461333208613928
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,3584,768,0.03771022293302748
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,3584,256,0.006254222244024277
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,3584,512,0.019256000717480976
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,3584,5120,0.041906668080223926
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,3584,512,0.032525334093305804
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,3584,128,0.00555377784702513
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,3584,7168,0.1713235510720147
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,3584,64,0.005211555709441503
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,3584,256,0.029155555698606703
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,3584,128,0.025361778007613286
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,3584,32,0.005128889034191768
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,3584,5120,0.12791289223564997
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,3584,128,0.01648977730009291
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,3584,64,0.016141333513789706
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,3584,32,0.015809777710172866
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,3584,3072,0.0869377785258823
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,3072,65536,0.37558576795789933
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,3072,51200,0.3163591225941976
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,3072,16384,0.10514933533138698
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,3584,1024,0.04385155439376831
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,3072,16384,0.29005689091152614
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,3072,12288,0.07559466361999512
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,3584,256,0.016876444220542908
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,3072,51200,0.8525279892815484
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,3072,16384,0.351398229598999
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,3072,10240,0.05927911069658068
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,3072,12288,0.20629689428541395
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,3072,8192,0.04758488800790575
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,3072,12288,0.26442133055792916
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,3072,10240,0.1666897800233629
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,3072,7168,0.042562666866514415
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,3072,65536,1.3405670589870875
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,3072,51200,1.0518329408433702
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,3072,8192,0.1321386628680759
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,3072,6144,0.03734222385618422
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,3072,8192,0.175491558180915
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,3072,5120,0.03131822082731459
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,3072,7168,0.11538667149013943
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,3072,7168,0.15610667069753012
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,3072,6144,0.1005893349647522
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,3072,6144,0.13706221845414904
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,3072,4096,0.026351999905374315
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,3072,3584,0.022967111733224656
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,3072,5120,0.08619911140865749
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,3072,5120,0.11773778332604302
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,3072,4096,0.07078755564159818
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,3072,3072,0.020224000016848247
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,3072,4096,0.09821066591474746
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,3072,3584,0.06289600001441108
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,3072,3584,0.08909422159194946
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,3072,65536,1.0910675260755751
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,3072,3072,0.07982755369610257
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,3072,3072,0.053736888700061373
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,3072,2048,0.015156444576051501
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,3072,1536,0.01236355553070704
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,3072,2560,0.04610933197869194
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,3072,2560,0.06964977582295735
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,3072,1024,0.009690666364298927
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,3072,2048,0.060771558019849986
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,3072,2048,0.03945511248376634
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,3072,768,0.008298666940795051
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,3072,1024,0.02478844424088796
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,3072,1024,0.04054311248991225
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,3072,512,0.006973333656787872
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,3072,768,0.02126400007141961
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,3072,10240,0.21828977266947427
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,3072,256,0.005535111245181825
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,3072,512,0.03151911165979173
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,3072,512,0.018523555662896898
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,3072,256,0.027608889672491286
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,3072,256,0.016182222300105624
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,3072,64,0.004589333302444882
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,3072,128,0.015853333804342482
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,3072,128,0.024309333827760484
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,3072,32,0.00453955555955569
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,3072,64,0.015469332536061605
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,3072,32,0.015184000134468079
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,3072,2560,0.017609778377744887
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,2560,65536,0.3346284495459662
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,2560,51200,0.26717956860860187
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,3072,1536,0.05055911011166043
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,2560,16384,0.09005333317650689
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,3072,768,0.035410665803485446
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,3072,128,0.004865777575307422
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,2560,65536,1.0324968761867948
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,2560,16384,0.25918756590949166
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,2560,12288,0.06384978029463026
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,2560,10240,0.05079288946257698
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,2560,16384,0.3503742218017578
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,2560,12288,0.19333688418070474
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,2560,12288,0.26377420955234104
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,2560,10240,0.15870489014519587
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,2560,8192,0.04213066564665901
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,2560,7168,0.037455999188952975
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,2560,10240,0.2178542216618856
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,2560,65536,1.3341591093275282
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,2560,8192,0.1248026688893636
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,2560,8192,0.1759857734044393
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,2560,51200,1.0460649066501193
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,2560,7168,0.1100533339712355
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,3072,1536,0.03128355410363939
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,2560,5120,0.028402666250864666
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,2560,7168,0.1554702255460951
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,2560,4096,0.02457422183619605
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,2560,6144,0.1364026731914944
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,2560,6144,0.09540888998243545
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,2560,5120,0.11668977472517227
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,2560,5120,0.08108711242675781
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,2560,4096,0.06708444489373101
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,2560,3072,0.019308444526460435
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,2560,4096,0.09804888566335042
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,2560,2560,0.016711999972661335
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,2560,3584,0.059501330057779946
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,2560,3584,0.08858578072653876
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,2560,3072,0.07925599813461304
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,2560,2048,0.014679999815093147
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,2560,2560,0.04392177859942118
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,2560,2560,0.06907466385099623
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,2560,51200,0.8210684458414713
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,2560,1536,0.012063110868136087
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,2560,2048,0.03678488731384277
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,2560,1024,0.00960177762640847
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,2560,2048,0.06052622530195448
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,2560,1536,0.03051466743151347
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,2560,768,0.008279999925030602
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,2560,1024,0.04019200139575534
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,2560,768,0.020602666669421725
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,2560,768,0.035304887427224055
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,2560,512,0.007143110864692264
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,2560,6144,0.03280444608794318
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,2560,512,0.03122399912940131
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,2560,512,0.017913776967260573
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,2560,256,0.005564444594913059
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,2560,128,0.005201777650250329
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,2560,256,0.015590222345458137
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,2560,3584,0.021532444490326777
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,2560,64,0.004868444469239977
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,2560,128,0.015065777632925244
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,2560,128,0.02501511077086131
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,2560,32,0.005562666803598404
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,2560,64,0.014774221513006421
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,2560,3072,0.05162222186724345
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,2560,32,0.014771555860837301
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,2048,65536,0.2533804575602214
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,2048,51200,0.21488711569044325
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,2560,1536,0.051144000556733876
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,2048,16384,0.06962133116192289
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,2560,1024,0.023800889650980633
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,2048,16384,0.24636265966627333
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,2048,12288,0.05094044407208761
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,2048,16384,0.3483555581834581
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,2560,256,0.02811644474665324
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,2048,51200,0.7670755386352539
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,2048,65536,0.9840941958957248
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,2048,10240,0.04585422078768412
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,2048,8192,0.0356026656097836
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,2048,12288,0.1842355595694648
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,2048,10240,0.15147199895646837
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,2048,12288,0.26297688484191895
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,2048,10240,0.21688000361124674
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,2048,7168,0.029389331738154095
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,2048,8192,0.11927021874321832
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,2048,6144,0.026354667213228013
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,2048,8192,0.17442933718363443
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,2048,5120,0.02372444503837162
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,2048,7168,0.10453333457310994
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,2048,51200,1.047646204630534
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,2048,65536,1.3229591581556532
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,2048,7168,0.15487999386257595
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,2048,6144,0.09116266833411323
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,2048,4096,0.019832000136375427
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,2048,3584,0.017753778232468497
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,2048,5120,0.07750488652123345
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,2048,5120,0.11582844787173802
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,2048,4096,0.09726488590240479
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,2048,3072,0.01573244399494595
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,2048,4096,0.06342222293217976
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,2048,3584,0.05585600270165337
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,2048,3584,0.0882951087421841
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,2048,2048,0.012103111379676394
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,2048,3072,0.04854844344986809
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,2048,3072,0.07813866933186848
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,2048,2560,0.041582223441865705
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,2048,2560,0.06915111011928983
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,2048,1536,0.009648000200589498
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,2048,1024,0.007706666986147563
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,2048,2048,0.03547733359866672
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,2048,2048,0.058928887049357094
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,2048,1536,0.02883022361331516
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,2048,768,0.006693333387374878
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,2048,1024,0.023005333211686876
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,2048,1024,0.04013777772585551
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,2048,512,0.0058853332367208265
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,2048,768,0.03525688913133409
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,2048,768,0.019686222076416016
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,2048,256,0.004868444469239977
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,2048,512,0.031165334913465712
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,2048,512,0.017204445269372728
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,2048,128,0.004527111020353106
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,2048,256,0.027387556102540758
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,2048,64,0.004247111164861255
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,2048,128,0.02439466615517934
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,2048,32,0.0041866666740841335
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,2048,64,0.014160888062583076
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,2048,6144,0.13548444377051458
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,2048,32,0.014094221923086377
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,1536,65536,0.19879021909501818
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,2048,2560,0.014067555467287699
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,1536,51200,0.16993155744340685
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,1536,16384,0.055014222860336304
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,2048,1536,0.048807998498280845
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,1536,16384,0.22877600457933214
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,1536,12288,0.03808800048298306
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,1536,51200,0.7023528946770562
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,1536,65536,0.8957173029581705
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,2048,256,0.015167999598715039
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,1536,16384,0.3128097852071126
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,1536,12288,0.17071999443901908
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,1536,10240,0.03249866763750712
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,2048,128,0.014579556054539151
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,1536,8192,0.02595377796226078
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,1536,12288,0.23557421896192762
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,1536,7168,0.02346311178472307
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,1536,51200,0.9320844014485677
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,1536,10240,0.1944026682111952
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,1536,8192,0.10525866349538167
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,1536,8192,0.15610755814446345
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,1536,6144,0.020647999313142564
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,1536,5120,0.017495999733606975
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,1536,7168,0.09577777650621201
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,1536,7168,0.13904000653160944
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,1536,6144,0.12194932831658258
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,1536,6144,0.07887555493248834
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,1536,4096,0.015104000767072042
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,1536,3584,0.01330311099688212
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,1536,5120,0.0710666643248664
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,1536,5120,0.10452355278862847
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,1536,3072,0.012089778151777057
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,1536,4096,0.08814489179187351
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,1536,4096,0.05749511056476169
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,1536,2560,0.010614222122563256
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,1536,3584,0.049984001451068454
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,1536,3584,0.08016000191370647
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,1536,2048,0.009296889106432596
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,1536,3072,0.04412800073623657
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,1536,3072,0.07191377878189087
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,1536,1536,0.007644444704055786
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,1536,2560,0.062900443871816
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,1536,2048,0.032519999477598406
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,1536,2048,0.053789334164725415
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,1536,1024,0.006254222244024277
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,1536,1536,0.04489511251449585
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,1536,1536,0.027007111244731482
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,1536,768,0.005607999861240387
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,1536,1024,0.03712622324625651
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,1536,1024,0.02130222154988183
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,1536,512,0.004851555658711327
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,1536,768,0.03291911217901442
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,1536,256,0.0042160000238153665
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,1536,512,0.016145777371194627
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,1536,512,0.029463112354278564
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,1536,65536,1.1857368681165907
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,1536,128,0.0038559999730851916
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,1536,256,0.014470222923490735
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,1536,256,0.026131555438041687
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,1536,64,0.003556444413132138
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,1536,128,0.02347466680738661
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,1536,32,0.0038817777401871155
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,1536,128,0.013790222505728403
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,1536,64,0.013731555806265937
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,1536,32,0.013461333182122974
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,1024,65536,0.15707111358642578
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,1024,51200,0.12594132953219944
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,1536,2560,0.038281778494517006
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,1024,16384,0.04020444552103678
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,1024,51200,0.6557946734958225
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,1536,768,0.018523555662896898
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,1024,65536,0.8360977702670627
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,1024,16384,0.21702044539981416
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,1536,10240,0.1400079992082384
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,1024,12288,0.029727111260096233
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,1024,10240,0.02421244482199351
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,1024,12288,0.16097511185540095
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,1024,10240,0.13082222143809
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,1024,12288,0.23382578955756295
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,1024,8192,0.01993600030740102
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,1024,10240,0.19383645057678223
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,1024,7168,0.017825777331988018
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,1024,51200,0.9261706670125326
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,1024,65536,1.178558243645562
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,1024,6144,0.015999999311235216
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,1024,8192,0.10322133037779067
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,1024,8192,0.15536888440450033
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,1024,5120,0.014288889037238227
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,1024,7168,0.137992885377672
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,1024,4096,0.012117333710193634
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,1024,6144,0.07823022206624348
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,1024,6144,0.12116977903578018
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,1024,3584,0.011403555671374003
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,1024,5120,0.06670133272806804
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,1024,5120,0.10417866706848145
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,1024,3072,0.010040000081062317
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,1024,4096,0.053063111172782056
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,1024,4096,0.08714844120873345
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,1024,2560,0.0086666668454806
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,1024,3584,0.046588444047504
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,1024,3584,0.0791520012749566
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,1024,2048,0.00793333351612091
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,1024,3072,0.042113777663972646
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,1024,3072,0.07059644328223334
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,1024,1536,0.006586666736337874
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,1024,2560,0.061455110708872475
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,1024,2560,0.03494488861825731
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,1024,2048,0.030200001266267564
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,1024,1024,0.005558222118351195
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,1024,2048,0.05486844314469231
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,1024,768,0.004915555732117759
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,1024,1536,0.025011556016074285
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,1024,1024,0.020280000236299302
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,1024,1024,0.03714399867587619
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,1024,512,0.0042364444169733255
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,1024,768,0.01757066614098019
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,1024,768,0.031897776656680636
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,1024,256,0.004190222256713443
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,1024,16384,0.3105084366268582
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,1024,512,0.015465777781274585
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,1024,128,0.003879111260175705
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,1024,256,0.013758222262064615
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,1024,256,0.02604266670015123
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,1024,64,0.0038488888078265717
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,1024,32,0.003855111284388436
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,1024,128,0.022987556126382615
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,1024,7168,0.09042577611075507
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,1024,64,0.013015111287434896
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,1024,32,0.01277511070171992
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,768,65536,0.12112088998158772
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,768,51200,0.10449955860773723
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,1024,1536,0.04464711083306206
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,768,16384,0.030360887447992962
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,768,51200,0.6247866418626573
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,768,65536,0.7954488860236274
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,768,12288,0.022357333037588332
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,1024,512,0.02881066666709052
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,768,16384,0.20624089241027832
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,768,10240,0.018977777825461496
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,1024,128,0.013415111435784234
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,768,12288,0.15394666459825304
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,768,16384,0.3071262306637234
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,768,8192,0.016007110476493835
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,768,51200,0.9149689144558377
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,768,65536,1.165869288974338
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,768,12288,0.23199823167588976
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,768,7168,0.014436443646748861
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,768,6144,0.012670222255918713
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,768,10240,0.12501688798268637
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,768,8192,0.09795644548204209
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,768,8192,0.15404089291890463
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,768,5120,0.011038222246699862
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,768,7168,0.13665955596499973
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,768,4096,0.009699555734793345
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,768,6144,0.075290666686164
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,768,6144,0.12047021918826634
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,768,3584,0.008745777938101027
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,768,5120,0.06290311283535428
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,768,5120,0.10319555468029445
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,768,3072,0.007864000068770515
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,768,4096,0.08649155828687881
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,768,3584,0.045422222879197865
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,768,3584,0.07882399691475762
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,768,2560,0.007322666545708974
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,768,2048,0.0063928887248039246
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,768,3072,0.038986666334999934
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,768,3072,0.07010933425691393
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,768,1536,0.005632888939645555
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,768,2560,0.06054400073157417
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,768,2560,0.033562666840023465
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,768,1024,0.004574222283230888
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,768,2048,0.052687999274995595
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,768,2048,0.028897778855429754
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,768,768,0.004528000122971005
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,768,1536,0.02400355537732442
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,768,1536,0.044201778040991895
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,768,512,0.0041777777175108595
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,768,1024,0.03669955664210849
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,768,1024,0.019899555378490023
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,768,256,0.003504000190231535
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,768,768,0.01683022247420417
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,768,768,0.032285332679748535
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,768,128,0.0035439998739295532
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,768,512,0.029147555430730183
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,768,256,0.026025777061780293
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,768,256,0.013398222625255585
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,768,64,0.0032213332338465583
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,768,32,0.0032186667538351486
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,768,128,0.023011555274327595
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,768,10240,0.1907271146774292
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,768,7168,0.08621511194441055
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,768,64,0.012714666624863943
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,512,65536,0.08848977751202053
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,768,32,0.012400888734393649
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,512,51200,0.06934577888912626
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,512,16384,0.02630311085118188
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,768,4096,0.050311999188529126
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,512,16384,0.2048577732510037
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,512,12288,0.028866665230857
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,512,16384,0.30620000097486705
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,512,51200,0.617054197523329
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,512,65536,0.7868764665391711
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,512,10240,0.02469066613250309
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,512,12288,0.15277955267164442
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,512,8192,0.020225778222084045
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,512,12288,0.23124355740017363
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,768,512,0.015150222513410779
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,512,10240,0.12515200508965388
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,512,7168,0.018212444252438016
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,512,10240,0.19060266017913818
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,768,128,0.012719111310111152
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,512,8192,0.09726133611467148
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,512,6144,0.016158221496476066
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,512,8192,0.15352177619934082
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,512,65536,1.1602747175428603
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,512,7168,0.08546933200624253
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,512,5120,0.014090667168299357
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,512,4096,0.008994667066468133
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,512,6144,0.0738088885943095
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,512,6144,0.11995911598205566
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,512,5120,0.0627617769771152
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,512,5120,0.10247555706236099
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,512,4096,0.049992889165878296
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,512,4096,0.08581244283252293
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,512,3072,0.007611555357774098
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,512,3584,0.04421600037150913
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,512,3584,0.07808622386720446
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,512,2560,0.0069226668112807805
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,512,3072,0.06971200307210286
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,512,2048,0.005872000008821487
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,512,2560,0.03385422295994229
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,512,2560,0.05957688887914022
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,512,1536,0.005200888961553574
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,512,2048,0.028650667932298448
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,512,2048,0.05237244566281637
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,512,1024,0.004537777768241035
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,512,1536,0.024043555061022442
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,512,1536,0.04348088966475593
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,512,51200,0.9113413492838541
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,512,768,0.0041804446114434134
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,512,1024,0.036335110664367676
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,512,1024,0.01956977778010898
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,512,512,0.0036115555299652945
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,512,768,0.03185955683390299
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,512,768,0.016819554898473952
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,512,512,0.014896889527638754
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,512,7168,0.13625778092278376
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,512,512,0.02875466810332404
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,512,128,0.0032017777363459268
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,512,256,0.02606666584809621
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,512,3584,0.008298666940795051
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,512,128,0.012721777790122561
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,512,128,0.022670222653283015
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,512,32,0.0032151111712058387
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,256,65536,0.05197599861356947
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,512,64,0.01239911135700014
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,512,32,0.012521777715947894
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,512,3072,0.03916977842648824
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,256,65536,0.7474604182773166
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,256,51200,0.5862737761603461
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,512,256,0.0032186667538351486
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,256,16384,0.01720355616675483
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,512,256,0.013078221844302284
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,512,64,0.0034959999223550162
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,256,12288,0.01516711049609714
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,256,16384,0.1948008934656779
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,256,65536,1.1542684766981337
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,256,10240,0.013433777623706393
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,256,12288,0.14546399646335179
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,256,51200,0.04222666554980808
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,256,8192,0.01312888910373052
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,256,12288,0.23054220941331652
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,256,7168,0.012099555797047086
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,256,10240,0.11843289269341363
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,256,10240,0.1898639996846517
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,256,6144,0.010631110933091907
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,256,8192,0.09192888604270087
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,256,8192,0.15290844440460205
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,256,7168,0.08045688602659437
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,256,5120,0.009304000271691216
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,256,51200,0.9075164794921875
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,256,4096,0.008231999973456064
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,256,6144,0.06947822040981717
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,256,6144,0.11921332942114936
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,256,3584,0.007634667058785756
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,256,5120,0.058837334314982094
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,256,5120,0.10194577773412068
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,256,4096,0.04681866698794895
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,256,3072,0.007796444826655918
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,256,4096,0.08558311065038045
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,256,2560,0.006599111275540457
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,256,3584,0.04191022117932638
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,256,3584,0.07731555567847358
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,256,2048,0.005589333259397083
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,256,3072,0.0368115570810106
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,256,2560,0.059198220570882164
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,256,2560,0.03151111139191522
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,256,1536,0.005187555733654234
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,256,1024,0.004173333446184794
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,256,2048,0.02711822258101569
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,256,2048,0.05195377932654487
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,256,1536,0.04325422313478258
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,256,768,0.0038844446341196695
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,256,1536,0.022970666488011677
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,256,16384,0.30494221051534015
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,256,512,0.003516444315512975
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,256,1024,0.03600088755289713
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,256,1024,0.018530666828155518
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,256,256,0.003170666595300039
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,256,768,0.03186755710177951
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,256,768,0.016180444094869826
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,256,512,0.028255999088287354
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,256,128,0.0031475555151700974
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,256,512,0.014125333891974555
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,256,256,0.012441777520709567
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,256,64,0.003154666680428717
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,256,256,0.025399999486075506
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,256,32,0.002855111120475663
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,256,128,0.022634666826989915
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,256,128,0.012115555504957834
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,256,64,0.011760888828171624
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,256,7168,0.13589510652754042
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,128,51200,0.03332355618476868
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,256,3072,0.06729244523578219
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,128,16384,0.013456000222100152
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,128,51200,0.5851510895623101
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,128,65536,0.7459475729200574
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,128,12288,0.011398221883508893
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,128,16384,0.1949839989344279
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,128,51200,0.9051360024346246
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,128,12288,0.1445324420928955
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,128,16384,0.3039982318878174
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,128,10240,0.01053600013256073
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,128,65536,1.1504906548394096
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,128,8192,0.009348444640636444
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,128,65536,0.04159644577238295
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,128,7168,0.008970666262838576
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,128,12288,0.23025245136684844
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,256,32,0.012079111403889127
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,128,10240,0.11722044150034587
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,128,6144,0.00868444475862715
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,128,10240,0.18947111235724556
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,128,8192,0.15279377831353083
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,128,5120,0.008301333420806462
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,128,7168,0.07964799801508586
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,128,7168,0.13587466875712076
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,128,4096,0.007616000043021307
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,128,6144,0.06917422347598605
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,128,6144,0.11893155839708115
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,128,3584,0.006980444822046492
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,128,5120,0.057982219590081104
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,128,5120,0.10179999801847671
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,128,3072,0.006510222123728857
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,128,4096,0.04640266630384657
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,128,4096,0.08517066637674968
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,128,2560,0.005943111247486538
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,128,3584,0.041160000695122614
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,128,3584,0.07574755615658231
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,128,2048,0.005527110977305307
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,128,3072,0.03571288784344991
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,128,3072,0.0685066646999783
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,128,1536,0.004871110949251386
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,128,2560,0.031152000029881794
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,128,2560,0.058952887852986656
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,128,1024,0.0041884444653987885
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,128,2048,0.027112000518374976
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,128,2048,0.051721778180864125
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,128,768,0.0038284444146686127
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,128,1536,0.043402665191226535
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,128,512,0.003559999995761447
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,128,1024,0.03568799959288703
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,128,768,0.016172443826993305
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,128,256,0.003220444545149803
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,128,512,0.014116444521480136
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,128,128,0.003156444471743372
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,128,256,0.012425777812798819
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,128,256,0.02475111186504364
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,128,64,0.002814222127199173
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,128,128,0.011728888584507836
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,128,128,0.022050667140218947
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,128,32,0.0028435554769304064
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,128,8192,0.09124355845981175
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,128,64,0.011755555868148804
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,64,65536,0.038873778449164495
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,64,51200,0.03420089019669427
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,128,32,0.012061333490742577
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,64,16384,0.01276177747382058
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,64,12288,0.011032889286677042
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,64,16384,0.19470132721794975
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,64,12288,0.14450489150153265
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,64,10240,0.01000711073478063
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,64,8192,0.008995555341243744
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,128,1536,0.022678222921159532
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,64,51200,0.5848862330118815
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,64,10240,0.11786577436659072
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,128,1024,0.018592000007629395
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,64,65536,0.7457911173502604
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,64,6144,0.008287111090289222
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,128,768,0.03154844376775954
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,64,5120,0.007896000312434303
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,64,4096,0.007640000018808577
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1536,128,512,0.02781244450145298
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,64,3584,0.007270221908887227
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,64,7168,0.07977066437403361
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,64,3072,0.0063786668082078295
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,64,5120,0.05843822161356608
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,64,4096,0.04584622383117676
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,64,2048,0.005252444495757421
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,64,3072,0.03497066762712266
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,64,2560,0.031230221192042034
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,64,1536,0.004556444370084339
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,64,2048,0.027103111147880554
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,64,1024,0.003855111284388436
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,64,1536,0.022647110952271357
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,64,768,0.003552000141806073
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,64,1024,0.018592889110247295
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,64,512,0.0032071111102898917
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,64,768,0.016120000018013846
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,64,256,0.0032044444233179092
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,64,512,0.014373333917723762
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,64,128,0.0027955555253558685
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,64,7168,0.008983111215962304
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,64,256,0.01239911135700014
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,64,64,0.0028364445186323593
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,64,8192,0.09140177567799886
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,64,32,0.0025395556456512874
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,64,128,0.012094222009181976
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,32,65536,0.03594311078389486
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,64,64,0.011713777979214987
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,32,51200,0.029862221744325426
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,64,6144,0.06926755772696601
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,32,16384,0.009332444104883406
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,32,12288,0.008016889293988546
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,64,3584,0.04118044508828057
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,32,10240,0.016182222300105624
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,32,16384,0.19430222776201037
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,32,12288,0.14465955893198648
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,32,8192,0.013975110318925647
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,32,7168,0.013066666821638743
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,32,10240,0.11739467249976264
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,32,6144,0.011943110989199745
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,32,51200,0.585394647386339
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,32,65536,0.7456489139133029
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,32,7168,0.07959644662009345
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,32,5120,0.01072088877360026
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,32,4096,0.009678222239017487
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,32,6144,0.06879111131032307
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,32,3584,0.009034666750166152
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,32,3072,0.006583111153708563
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,32,5120,0.05812622441185845
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,32,4096,0.04591022266281975
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,32,2560,0.005614222337802251
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,32,2048,0.005565333283609814
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,32,3072,0.03560444381501939
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,32,1536,0.004538666870858935
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,32,2560,0.03122399912940131
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,32,1024,0.003908444609906939
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,32,2048,0.027124444643656414
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,64,32,0.011830222275522021
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,64,2560,0.005920889063013925
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,32,512,0.0034862222770849862
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,32,768,0.016159999701711867
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,32,256,0.002858666703104973
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,32,512,0.014110222458839417
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,32,128,0.0028577778074476454
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,32,256,0.012464000119103326
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,32,64,0.0028613333900769553
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,32,128,0.0120328888297081
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,32,32,0.0025271111064487034
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,32,8192,0.09116355578104655
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,32,32,0.011757333245542316
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,32,3584,0.041165331999460854
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1536,32,768,0.0035502223504914176
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,32,1536,0.022687999738587275
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,32,1024,0.018581334087583754
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1536,32,64,0.011917333636018964
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,65536,12288,1.3428897857666016
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,65536,16384,1.7757813135782878
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,65536,12288,1.4087350633409288
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,65536,10240,1.186828401353624
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,65536,10240,1.1853289074367948
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,65536,16384,1.9918265872531469
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,65536,8192,0.7959849039713541
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,65536,7168,0.6864542431301541
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,65536,6144,0.5562311278449165
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,65536,5120,0.5295564333597819
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,65536,7168,0.8167520099216037
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,65536,6144,0.6746702194213867
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,65536,4096,0.4077626599205865
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,65536,5120,0.6218826505872939
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,65536,3584,0.37790844175550675
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,65536,3584,0.3957306543986003
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,65536,3072,0.30511734220716685
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,65536,3072,0.34509778022766113
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,65536,4096,0.48213153415256077
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,65536,2048,0.213119109471639
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,65536,1536,0.16603110896216497
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,65536,2560,0.29103467199537486
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,65536,8192,0.9487893846299914
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,65536,1024,0.10445688830481635
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,65536,2048,0.2426719930436876
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,65536,768,0.08894311057196723
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,65536,512,0.06059110826916165
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,65536,1536,0.19975554943084717
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,65536,1024,0.1463760005103217
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,65536,256,0.045977777904934354
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,65536,768,0.12753510475158691
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,65536,128,0.042303111818101674
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,65536,64,0.038650665018293597
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,65536,512,0.10094488991631402
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,65536,256,0.09256711271074082
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,65536,32,0.04109422365824381
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,65536,128,0.08583111233181423
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,65536,64,0.08557599782943726
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,65536,32,0.08598844210306804
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,65536,51200,5.453836652967666
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,65536,2560,0.2699351045820448
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,65536,51200,6.860735151502822
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,51200,16384,1.3624898062811956
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,51200,16384,1.5909795761108398
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,51200,10240,0.7866969108581543
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,51200,12288,1.0027955373128254
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,51200,12288,1.1810311211480033
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,51200,8192,0.6576853328280979
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,51200,51200,4.025382147894965
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,51200,10240,0.9453581704033746
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,51200,8192,0.7506462203131782
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,51200,7168,0.5986293156941732
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,51200,6144,0.5012044376797146
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,51200,6144,0.5490942001342773
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,51200,5120,0.4173297882080078
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,51200,65536,5.181104024251302
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,51200,7168,0.6364497608608669
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,51200,4096,0.32092444101969403
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,51200,5120,0.5328942404852973
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,51200,3584,0.28008445103963214
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,51200,4096,0.3657200071546767
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,51200,3072,0.22084621588389078
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,51200,2560,0.22267201211717394
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,51200,2048,0.15182667308383518
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,51200,51200,5.406943851047092
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,51200,3072,0.2827235592736138
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,51200,1536,0.12859643830193415
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,51200,2048,0.19428622722625732
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,51200,2560,0.24978221787346733
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,51200,768,0.0706275569068061
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,51200,1536,0.1646302276187473
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,51200,3584,0.3318008846706814
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,51200,1024,0.11955111556582981
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,51200,256,0.03872888949182298
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,51200,128,0.03462222218513489
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,51200,768,0.09483822186787923
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,51200,512,0.0965848896238539
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,51200,64,0.03295822276009454
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,51200,256,0.07555466890335083
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,51200,32,0.04066488809055752
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,51200,128,0.07135999865002103
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,51200,64,0.07003021902508207
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,51200,32,0.07045688894059923
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,16384,16384,0.4127297666337755
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,51200,1024,0.09775466389126247
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,51200,512,0.05024622215165032
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,16384,12288,0.29096799426608616
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,51200,65536,7.592274983723958
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,16384,51200,1.334274715847439
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,16384,16384,0.5854453510708278
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,16384,12288,0.4181022114223904
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,16384,10240,0.2442479928334554
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,16384,8192,0.22132089402940539
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,16384,65536,1.7800000508626301
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,16384,8192,0.2763600084516737
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,16384,7168,0.17431999577416313
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,16384,10240,0.3598799970414903
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,16384,6144,0.16274578041500515
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,16384,7168,0.24753332138061523
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,16384,5120,0.17753333515591094
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,16384,6144,0.23418045043945312
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,16384,51200,2.0615289476182723
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,16384,4096,0.1478417714436849
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,16384,3072,0.08535022205776638
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,16384,2560,0.0752355522579617
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,16384,3584,0.12794221772087946
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,16384,2048,0.05966666671964857
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,16384,3072,0.11334755685594346
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,16384,1536,0.04689777890841166
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,16384,65536,2.5387280782063804
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,16384,1024,0.03408622079425388
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,16384,2048,0.0820337798860338
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,16384,768,0.026391999589072332
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,16384,1536,0.06578044758902656
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,16384,512,0.020616888999938965
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,16384,256,0.01575911045074463
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,16384,1024,0.05123466584417555
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,16384,768,0.041555556986067034
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,16384,128,0.01309333327743742
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,16384,512,0.03421955638461643
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,16384,256,0.031023999055226643
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,16384,64,0.011375111010339526
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,16384,32,0.011520889070298938
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,16384,128,0.029117332564459905
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,16384,64,0.029164443413416546
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,16384,5120,0.1396977769003974
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,16384,32,0.028705779049131606
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,16384,3584,0.10042311085595025
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,12288,16384,0.31564532385932076
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,16384,2560,0.09888444344202678
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,12288,12288,0.24123644828796387
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,12288,16384,0.47264888551500106
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,12288,51200,0.8199697600470649
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,12288,10240,0.2103724479675293
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,12288,12288,0.3411688804626465
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,12288,8192,0.17107910580105254
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,12288,10240,0.28125866254170734
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,12288,7168,0.14878400166829428
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,12288,8192,0.22579556041293672
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,12288,6144,0.12743733988867864
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,12288,7168,0.1980604463153415
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,12288,5120,0.10783111386828953
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,12288,51200,1.5445867114596898
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,12288,6144,0.17233778370751274
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,12288,4096,0.08359644148084854
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,12288,3584,0.06476710902320014
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,12288,5120,0.14586577150556776
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,12288,4096,0.11954132715861003
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,12288,3072,0.06268355581495497
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,12288,65536,1.9881528218587239
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,12288,3584,0.11857155958811443
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,12288,2560,0.05105066630575392
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,12288,2048,0.04312888781229655
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,12288,1536,0.03352800011634827
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,12288,3072,0.09365510940551758
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,12288,2560,0.08136000235875447
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,12288,1024,0.025010666913456384
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,12288,768,0.01925066610177358
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,12288,2048,0.0698488884501987
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,12288,512,0.01514311134815216
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,12288,1536,0.05351644423272875
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,12288,256,0.011722666521867117
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,12288,1024,0.041800889703962535
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,12288,65536,1.267330699496799
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,12288,768,0.034803556071387395
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,12288,128,0.010053333308961656
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,12288,512,0.029912889003753662
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,12288,64,0.008919999831252629
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,12288,32,0.009299555586444007
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,12288,256,0.02574577762020959
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,16384,4096,0.10868177811304729
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,12288,128,0.02472711106141408
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,12288,64,0.024672889047198828
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,12288,32,0.02506133251720005
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,10240,16384,0.23756088150872123
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,10240,12288,0.2037066618601481
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,10240,10240,0.17828799618615043
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,10240,16384,0.4130942291683621
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,10240,51200,0.7501297526889377
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,10240,12288,0.3100328975253635
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,10240,65536,1.0227013693915474
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,10240,7168,0.1217128833134969
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,10240,10240,0.27341243955824107
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,10240,6144,0.10023733642366196
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,10240,8192,0.22909598880343965
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,10240,5120,0.08779378069771661
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,10240,6144,0.15980533758799234
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,10240,7168,0.19292799631754556
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,10240,4096,0.06718933582305908
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,10240,3584,0.0641875531938341
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,10240,5120,0.13442933559417725
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,10240,51200,1.3623581992255316
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,10240,3072,0.05535466803444756
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,10240,4096,0.10780533154805501
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,10240,2560,0.048940443330340914
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,10240,3584,0.09747644265492757
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,10240,2048,0.03874489002757602
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,10240,1536,0.028637333048714533
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,10240,3072,0.08726666371027629
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,10240,2560,0.07432978020773993
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,10240,1024,0.02160355614291297
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,10240,65536,1.7743573718600805
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,10240,768,0.017430222696728177
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,10240,2048,0.06044355365965101
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,10240,1536,0.04888977938228183
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,10240,512,0.01447111037042406
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,10240,128,0.009180444810125563
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,10240,1024,0.03844711184501648
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,10240,768,0.0319164428446028
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,10240,64,0.007996444072988298
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,10240,8192,0.14398222499423557
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,10240,256,0.010341333018408881
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,10240,128,0.023003555006451074
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,10240,64,0.02255200015174018
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,10240,32,0.022297778063350256
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,8192,51200,0.6048933135138618
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,8192,65536,0.8476897875467936
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,8192,16384,0.2263537777794732
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,8192,12288,0.17522754934098986
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,10240,512,0.026994667119450037
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,8192,16384,0.3598968982696533
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,10240,32,0.008346666892369589
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,8192,10240,0.1742080052693685
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,8192,8192,0.12308622731102838
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,8192,51200,1.1705350875854492
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,8192,12288,0.2874942090776232
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,8192,7168,0.12295288509792751
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,8192,10240,0.21709244781070283
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,8192,6144,0.08750577767690022
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,8192,8192,0.174072888162401
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,8192,65536,1.5195022159152562
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,8192,5120,0.08912355369991726
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,8192,7168,0.15537510977851018
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,8192,4096,0.0662248863114251
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,8192,3584,0.06020000245836046
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,8192,6144,0.13688622580634222
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,8192,3072,0.05185155404938591
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,8192,4096,0.09304355250464545
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,8192,5120,0.11341510878668891
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,8192,3584,0.0863484475347731
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,8192,2048,0.035394665267732404
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,8192,3072,0.07525244686338636
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,8192,1536,0.02879377868440416
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,8192,1024,0.018072888255119324
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,8192,2560,0.06355022059546576
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,8192,768,0.0166311115026474
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,8192,2048,0.05358844333224826
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,8192,512,0.01202400028705597
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,8192,1536,0.04298311140802172
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,8192,256,0.009320889082219865
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,8192,1024,0.035029331843058266
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,8192,128,0.007600888609886169
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,8192,64,0.006575111299753189
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,8192,768,0.028387556473414104
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,8192,512,0.024362666739357844
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,8192,256,0.021291555629836187
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,8192,32,0.006622222148709827
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,8192,128,0.020587555236286588
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,8192,64,0.020273778173658583
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,8192,32,0.020281778441535104
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,10240,256,0.023373333944214716
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,7168,16384,0.20897244082556832
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,7168,16384,0.3358924388885498
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,7168,12288,0.16494488716125488
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,7168,51200,0.6341733402676052
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,8192,2560,0.044812444183561534
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,7168,65536,0.7488489151000977
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,7168,10240,0.12527555889553493
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,7168,7168,0.08724888828065659
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,7168,8192,0.09068355295393203
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,7168,12288,0.2449866665734185
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,7168,10240,0.23523910840352377
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,7168,8192,0.18337510691748726
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,7168,5120,0.0646524429321289
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,7168,7168,0.15667200088500977
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,7168,6144,0.12356889247894287
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,7168,4096,0.05350311266051399
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,7168,3584,0.04548089040650261
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,7168,5120,0.11275377538469102
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,7168,3072,0.03862399856249491
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,7168,65536,1.3857830895317926
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,7168,4096,0.09014399846394856
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,7168,2560,0.03306844499376085
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,7168,2048,0.027767111857732136
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,7168,3584,0.07789511150783963
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,7168,1536,0.02269511090384589
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,7168,1024,0.01763911048571269
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,7168,2560,0.059502224127451576
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,7168,2048,0.049545778168572314
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,7168,768,0.014820444915029736
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,7168,1536,0.04049688908788893
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,7168,512,0.011668444507651858
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,7168,256,0.008967999782827165
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,7168,768,0.026717333330048457
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,7168,512,0.02264444364441766
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,7168,128,0.007271111011505127
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,7168,256,0.020064888728989493
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,7168,64,0.00629688882165485
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,7168,32,0.006575999988449945
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,7168,128,0.0195795562532213
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,7168,64,0.01924622224436866
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,7168,32,0.018935999936527677
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,7168,6144,0.06804888778262667
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,7168,51200,1.088915506998698
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,6144,16384,0.13957777288224962
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,6144,12288,0.10043644242816502
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,6144,51200,0.436459567811754
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,6144,10240,0.09495555692248875
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,6144,16384,0.3107093440161811
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,7168,3072,0.06940711206860013
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,6144,8192,0.07769155502319336
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,6144,12288,0.22634845309787324
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,7168,1024,0.033019555939568415
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,6144,7168,0.06788000133302477
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,6144,10240,0.19810577233632407
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,6144,6144,0.05802222092946371
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,6144,5120,0.050092445479498975
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,6144,7168,0.13162577152252197
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,6144,4096,0.04059200154410468
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,6144,6144,0.11499644650353326
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,6144,3584,0.03636799918280707
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,6144,5120,0.09754666354921128
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,6144,65536,1.2796017328898113
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,6144,3072,0.031136890252431233
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,6144,2560,0.02721422248416477
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,6144,3584,0.07264177666770087
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,6144,4096,0.07939555247624715
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,6144,3072,0.06178222099939982
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,6144,1536,0.018616888258192275
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,6144,2560,0.05516977773772346
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,6144,1024,0.016295111841625638
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,6144,768,0.013716444373130798
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,6144,2048,0.04586933387650383
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,6144,1536,0.037294222248925105
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,6144,1024,0.030213332838482324
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,6144,512,0.00962755580743154
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,6144,65536,0.5396186510721842
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,6144,256,0.007632888853549957
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,6144,768,0.024528000089857314
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,6144,128,0.006631111105283101
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,6144,64,0.005576000031497743
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,6144,512,0.02128711177243127
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,6144,32,0.005897777775923411
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,6144,256,0.019162666466501024
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,6144,64,0.018557333283954196
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,6144,32,0.017866666118303936
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,6144,8192,0.14856266975402832
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,6144,51200,0.9991369247436523
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,5120,65536,0.48041688071356875
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,5120,16384,0.13724177413516575
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,5120,51200,0.3849528895484076
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,6144,2048,0.023064000738991633
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,5120,12288,0.10644088851081
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,5120,10240,0.08924977646933661
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,5120,16384,0.295575115415785
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,5120,12288,0.21467999617258707
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,5120,10240,0.17105421755048963
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,5120,7168,0.05989155504438612
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,5120,6144,0.05064622229999966
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,5120,8192,0.13917511039310032
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,5120,65536,1.1472853554619682
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,5120,5120,0.0424231125248803
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,5120,4096,0.03616711166169908
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,5120,6144,0.1067075530687968
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,5120,3584,0.03103111187616984
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,5120,5120,0.09122311406665379
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,5120,3072,0.029677334758970473
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,5120,4096,0.0754622220993042
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,5120,2560,0.02330577704641554
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,5120,3584,0.06736799743440416
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,5120,2048,0.02012711101108127
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,5120,3072,0.05702310800552368
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,5120,1536,0.016083555089102853
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,5120,2048,0.042615112331178456
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,5120,1024,0.012422222230169507
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,5120,1536,0.03465777635574341
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,5120,768,0.009860444400045607
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,5120,8192,0.06931200292375353
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,5120,1024,0.02792533238728841
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,5120,512,0.00794577764140235
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,5120,256,0.006592888798978593
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,5120,768,0.02348800003528595
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,5120,128,0.005919111271699269
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,5120,512,0.019944889677895438
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,5120,51200,0.9031030866834852
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,6144,128,0.01831733352608151
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,5120,7168,0.12168978320227729
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,5120,32,0.005562666803598404
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,5120,64,0.017210667332013447
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,5120,32,0.016880000631014507
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,4096,65536,0.3549511167738173
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,5120,2560,0.049828443262312144
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,4096,51200,0.34563554657830137
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,4096,16384,0.10246666934755112
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,4096,12288,0.08270133203930326
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,4096,16384,0.27267999119228786
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,4096,10240,0.0812622242503696
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,4096,12288,0.1899262269337972
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,5120,64,0.005544888890451855
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,4096,8192,0.06222222248713175
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,4096,7168,0.04998311069276598
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,5120,128,0.01753777762254079
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,4096,6144,0.04343733191490173
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,4096,10240,0.15492178334130183
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,4096,51200,0.8347102271185981
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,4096,5120,0.03679644399219089
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,4096,8192,0.12553689214918348
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,4096,4096,0.03152711192766825
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,4096,7168,0.11237155066596137
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,4096,3584,0.027395556370417278
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,4096,3072,0.024599111742443506
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,4096,6144,0.09740533431371053
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,4096,5120,0.08267199993133545
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,4096,2560,0.02563200063175625
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,4096,4096,0.06838488578796387
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,4096,2048,0.01811644434928894
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,4096,1536,0.014539556370841132
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,4096,3584,0.06146488587061564
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,4096,3072,0.052449779378043286
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,4096,1024,0.010675555302037133
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,4096,768,0.008963555925422246
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,4096,2560,0.046090665790769786
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,4096,512,0.007242666350470648
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,4096,2048,0.04002755549218919
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,4096,1536,0.03153866529464722
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,4096,1024,0.025056888659795124
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,4096,128,0.005205333232879639
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,4096,768,0.021612443857722815
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,4096,64,0.004872000051869286
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,4096,512,0.018958222534921434
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,4096,32,0.004591111093759537
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,4096,256,0.01682577696111467
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,4096,128,0.016207110550668504
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,4096,64,0.016146666473812528
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,4096,32,0.016061334146393668
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,5120,256,0.017855111095640395
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,3584,51200,0.3013519975874159
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,4096,65536,1.0525627136230469
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,3584,16384,0.10029244422912598
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,3584,12288,0.08061510986751981
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,3584,10240,0.06017422013812595
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,3584,16384,0.2692382335662842
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,3584,12288,0.17866933345794678
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,3584,8192,0.050423112180497914
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,3584,10240,0.14578666951921251
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,3584,51200,0.766266663869222
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,3584,7168,0.0432533323764801
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,3584,65536,0.987360848320855
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,4096,256,0.00628355559375551
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,3584,8192,0.11774933338165283
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,3584,5120,0.03204977843496535
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,3584,4096,0.026322666141721938
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,3584,7168,0.10484711329142253
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,3584,6144,0.09377866983413696
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,3584,3584,0.02369955513212416
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,3584,3072,0.020899555749363367
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,3584,5120,0.07807022333145142
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,3584,2560,0.018346667289733887
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,3584,4096,0.06362666686375935
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,3584,2048,0.015949333707491558
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,3584,1536,0.013065777719020844
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,3584,3072,0.05022755596372816
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,3584,1024,0.010741333166758219
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,3584,2560,0.043062223328484424
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,3584,2048,0.0370142228073544
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,3584,768,0.008645333349704742
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,3584,512,0.007311999797821045
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,3584,65536,0.39302221934000653
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,3584,256,0.0059004442559348206
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,3584,1024,0.0239991115199195
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,3584,128,0.004927111168702443
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,3584,768,0.020647111866209242
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,3584,512,0.018142221702469718
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,3584,64,0.004895110925038655
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,3584,256,0.01622488929165734
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,3584,128,0.015828443898095023
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,3584,64,0.015680889288584392
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,3584,32,0.015408888459205627
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,3072,65536,0.3033955627017551
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,3072,51200,0.25532976786295575
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,3072,16384,0.08280977937910292
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,3584,3584,0.056236445903778076
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,3072,16384,0.25078044997321236
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,3072,12288,0.065065774652693
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,3584,1536,0.029959999852710303
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,3072,10240,0.051663110653559365
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,3072,8192,0.04025600022739834
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,3072,51200,0.7232097519768609
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,3072,12288,0.17242933644188774
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,3584,32,0.005214222189452913
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,3072,7168,0.03614133265283372
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,3072,6144,0.03141866789923774
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,3072,8192,0.11191288630167644
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,3072,5120,0.028063111835055884
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,3072,4096,0.022664889693260193
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,3072,7168,0.10071111387676662
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,3072,6144,0.08712177806430393
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,3072,3584,0.02011999984582265
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,3072,5120,0.073853333791097
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,3072,3072,0.017981333865059745
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,3584,6144,0.03733511103524102
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,3072,2560,0.01591199967596266
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,3072,4096,0.06084533532460531
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,3072,2048,0.013493333425786761
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,3072,3584,0.05367911193105909
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,3072,1536,0.011231111155615913
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,3072,1024,0.008993777963850234
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,3072,3072,0.046738667620552905
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,3072,768,0.007643555601437886
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,3072,2048,0.03531288769510057
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,3072,512,0.006592888798978593
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,3072,1024,0.02279022170437707
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,3072,256,0.005380444642570283
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,3072,768,0.0199644449684355
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,3072,128,0.0046160001721647055
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,3072,256,0.015805333852767944
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,3072,64,0.0042239998777707415
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,3072,128,0.015512888630231222
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,3072,65536,0.9228053622775607
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,3072,32,0.0042453333735466
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,3072,64,0.015132443772421943
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,3072,10240,0.1384613381491767
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,3072,32,0.014854222536087036
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,2560,65536,0.25768621762593585
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,2560,16384,0.07281866338517931
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,2560,51200,0.2250462108188205
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,2560,12288,0.05424888928731283
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,2560,10240,0.047929777039421924
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,2560,16384,0.21888711717393664
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,2560,12288,0.1629342238108317
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,2560,8192,0.03612355391184489
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,2560,10240,0.13154933187696669
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,3072,2560,0.04109955496258206
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,2560,7168,0.03051911128891839
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,3072,1536,0.028098666005664404
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,2560,6144,0.027169777287377253
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,2560,51200,0.6810888714260526
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,2560,5120,0.0236826671494378
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,2560,8192,0.10763555765151978
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,2560,4096,0.019792889555295307
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,2560,7168,0.09412266810735066
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,2560,65536,0.8742639753553602
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,2560,3584,0.01779022150569492
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,2560,6144,0.08239555358886719
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,2560,2560,0.014513777361975776
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,2560,4096,0.05651999844445122
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,2560,3584,0.05032711227734884
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,2560,3072,0.044750223557154335
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,2560,1536,0.010480889015727572
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,2560,2560,0.03855999973085191
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,2560,1024,0.008300444318188561
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,2560,2048,0.032983111010657415
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,2560,1536,0.027518222729365032
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,2560,768,0.0069164443347189165
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,2560,512,0.005946666830115848
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,2560,1024,0.02197511163022783
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,2560,256,0.004881777697139316
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,2560,768,0.019275556008021038
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,2560,512,0.01682844426896837
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,2560,128,0.00452888881166776
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,2560,64,0.003948444293604957
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,2560,256,0.015488889482286243
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,2560,32,0.004206222378545337
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,2560,128,0.015118221441904703
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,2560,64,0.014819555812411837
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,2560,32,0.014450665977266101
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,2048,65536,0.20279110802544487
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,3072,512,0.01721333298418257
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,2048,51200,0.17189333173963758
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,2560,3072,0.016688000824716356
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,2560,5120,0.0700977775785658
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,2048,12288,0.043325334787368774
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,2560,2048,0.012404444317022959
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,2048,10240,0.03490399983194139
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,2048,8192,0.030962665875752766
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,2048,16384,0.20744800567626953
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,2048,12288,0.1527671151691013
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,2048,7168,0.02677244444688161
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,2048,10240,0.12458666165669759
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,2048,6144,0.021635555558734473
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,2048,5120,0.018736888964970905
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,2048,65536,0.8195102479722766
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,2048,51200,0.6421422428554958
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,2048,7168,0.08916088607576157
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,2048,4096,0.016345777445369296
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,2048,6144,0.07794400056203206
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,2048,3584,0.014518222875065274
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,2048,3072,0.013767110804716745
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,2048,2560,0.011720000041855706
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,2048,4096,0.054195556375715465
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,2048,3584,0.047770665751563184
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,2048,2048,0.009945777555306753
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,2048,3072,0.041814221276177295
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,2048,1536,0.008349333372380998
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,2048,2560,0.03677511215209961
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,2048,2048,0.031154665682050917
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,2048,768,0.00600622221827507
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,2048,1024,0.020921778347757127
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,2048,512,0.005208888815508948
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,2048,768,0.018550222118695576
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,2048,16384,0.059862222936418324
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,2048,256,0.004534222185611725
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,2048,128,0.0038844446341196695
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,2048,512,0.016185777054892648
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,2048,64,0.003552888830502828
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,2048,256,0.014649778604507446
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,2048,32,0.0036480000449551474
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,2048,128,0.014152000347773233
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,2048,64,0.01408622165520986
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,2048,8192,0.10025866826375325
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,2048,32,0.013765333427323235
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,1536,65536,0.20832355817159018
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,1536,16384,0.05459466576576233
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,1536,51200,0.1584213309817844
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,1536,12288,0.04149688945876227
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,2048,1024,0.0069306666652361555
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,1536,16384,0.19651644759707979
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,1536,10240,0.03340977761480544
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,1536,12288,0.14427733421325684
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,2048,1536,0.025734222597546045
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,1536,8192,0.026712000370025635
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,1536,51200,0.6045093536376953
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,1536,65536,0.7695573170979818
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,1536,10240,0.11722044150034587
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,1536,6144,0.021147555775112573
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,1536,5120,0.01827911039193471
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,1536,8192,0.09463200304243301
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,1536,7168,0.08395644691255356
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,1536,4096,0.015671999918089975
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,1536,3584,0.013975110318925647
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,1536,6144,0.0734622213575575
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,1536,3072,0.012654222548007965
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,1536,5120,0.06135111384921604
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,1536,2560,0.010899555351999072
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,1536,2048,0.009328000247478485
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,1536,3584,0.0447964436478085
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,1536,1536,0.00811644477976693
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,1536,3072,0.039098666773902044
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,1536,2560,0.03398222062322829
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,1536,1024,0.006598222172922558
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,1536,2048,0.029742221037546795
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,1536,768,0.005933333188295364
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,1536,1536,0.024697777297761705
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,1536,1024,0.02029244436158074
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,1536,768,0.017649778061442904
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,2048,5120,0.06618577904171415
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,1536,256,0.004535111288229625
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,1536,512,0.015801777442296345
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,1536,128,0.0038542221817705366
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,1536,64,0.0035031110876136353
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,1536,256,0.014110222458839417
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,1536,128,0.013761777844693927
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,1536,64,0.013409777647919126
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,1024,65536,0.13150755564371744
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,1536,7168,0.023698666029506262
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,1024,51200,0.1023813353644477
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,1024,16384,0.03658577799797058
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,1536,4096,0.049597332874933876
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,1024,16384,0.18480000231001112
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,1024,12288,0.02660088903374142
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,1024,10240,0.021702221698231165
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,1024,65536,0.7176791297064887
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,1024,51200,0.562877337137858
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,1536,512,0.005191111316283544
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,1024,12288,0.1387288835313585
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,1024,7168,0.016307555966907077
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,1024,6144,0.014873777826627096
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,1024,10240,0.11049155394236247
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,1024,5120,0.01312444441848331
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,1024,8192,0.08878666824764675
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,1024,7168,0.07942310969034831
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,1024,4096,0.011125333607196808
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,1536,32,0.003673777812057071
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,1024,6144,0.06834755341211955
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,1024,3584,0.009995555712117089
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,1024,3072,0.009015999734401703
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,1024,5120,0.05693866809209188
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,1024,2560,0.008238222036096785
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,1024,2048,0.00692622239391009
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,1536,32,0.013423110875818463
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,1024,3584,0.041788445578681103
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,1024,3072,0.037010666396882795
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,1024,1536,0.006249777972698212
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,1024,1024,0.005249777601824866
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,1024,2560,0.03151199883884854
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,1024,768,0.004587555511130227
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,1024,2048,0.027756444282001917
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,1024,512,0.0041751112374994485
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,1024,1536,0.023358222511079576
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,1024,256,0.0038293335172865125
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,1024,1024,0.01921955578856998
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,1024,128,0.003544888976547453
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,1024,64,0.003175111073586676
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,1024,512,0.014813333749771118
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,1024,256,0.013415111435784234
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,1024,32,0.003314666656984223
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,1024,128,0.01313688854376475
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,1024,64,0.013077333569526672
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,768,65536,0.10428177648120457
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,1024,32,0.012727110750145383
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,768,51200,0.0839937792883979
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,768,16384,0.03324355681737264
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,768,12288,0.025384000606007043
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,1024,8192,0.019357333580652874
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,768,10240,0.020922667450375024
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,768,16384,0.17539466751946342
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,768,12288,0.1291217803955078
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,768,8192,0.017700443665186565
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,768,10240,0.10472444693247478
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,768,7168,0.015771556231710646
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,768,6144,0.014115555418862237
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,768,51200,0.534637345208062
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,768,65536,0.676821337805854
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,768,5120,0.012425777812798819
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,1024,4096,0.046831111113230385
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,768,4096,0.011348444554540845
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,768,7168,0.0746062199274699
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,768,3584,0.00997688869635264
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,768,6144,0.06465599934260051
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,768,3072,0.009294222626421187
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,768,5120,0.054021331999037
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,768,4096,0.043825778696272105
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,768,3584,0.03974755605061849
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,768,2048,0.0069475554757648045
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,768,3072,0.03503111004829407
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,768,1536,0.00629688882165485
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,1024,768,0.016826666063732572
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,768,1024,0.005761777775155173
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,768,2560,0.030177778667873804
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,768,768,0.004928888960017098
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,768,512,0.004206222378545337
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,768,2048,0.026439110438028973
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,768,1536,0.022163555026054382
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,768,1024,0.018544889158672757
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,768,256,0.0035662220584021676
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,768,768,0.016209777858522203
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,768,128,0.0035137778355015647
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,768,64,0.0032346666687064697
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,768,256,0.013072888884279462
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,768,32,0.003167111012670729
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,768,128,0.012786666552225748
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,768,64,0.012396444049146442
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,512,65536,0.08633155292934841
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,768,32,0.01220355596807268
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,512,51200,0.06940088669459026
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,512,16384,0.027170666389995154
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,512,12288,0.021292444732454088
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,768,8192,0.08383378055360581
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,512,10240,0.019333332777023315
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,512,16384,0.17419466707441542
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,512,12288,0.12763822078704834
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,512,8192,0.01650311052799225
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,768,2560,0.008220444122950235
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,512,7168,0.01648355523745219
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,512,51200,0.5269324514600966
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,512,10240,0.10310400194591945
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,512,65536,0.6720408863491483
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,512,8192,0.0827831096119351
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,512,5120,0.012040889097584618
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,512,7168,0.07304266426298353
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,512,4096,0.009022222624884712
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,512,3584,0.00832444429397583
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,512,3072,0.007994666695594788
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,512,6144,0.06366044282913208
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,512,5120,0.05306222372584873
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,512,4096,0.0431600014368693
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,512,2560,0.00674044465025266
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,512,3584,0.03800977932082282
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,512,2048,0.006224000205596288
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,768,512,0.01478666729397244
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,512,1536,0.005551110953092575
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,512,3072,0.03371289041307237
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,512,2560,0.02993511160214742
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,512,768,0.004173333446184794
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,512,2048,0.02643377747800615
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,512,512,0.003663111064169142
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,512,1536,0.022279111875428095
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,512,256,0.0032195556494924757
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,512,1024,0.01815200017558204
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,512,128,0.0031591111587153543
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,512,768,0.015934222274356417
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,512,64,0.0031635556370019913
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,512,512,0.014512888259357877
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,512,32,0.0028640000770489373
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,512,256,0.01276088919904497
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,512,128,0.012387555506494312
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,256,65536,0.04723644587728712
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,256,51200,0.04201066825124952
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,512,32,0.01239999963177575
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,256,16384,0.015394666128688388
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,256,12288,0.013457777599493662
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,256,16384,0.16467732853359646
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,256,12288,0.1196204423904419
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,512,6144,0.013441777891582914
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,256,10240,0.01346666696998808
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,256,8192,0.013471110827393003
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,256,51200,0.49595022201538086
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,256,7168,0.011712888876597086
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,256,6144,0.010668444136778513
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,256,65536,0.631607108645969
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,256,10240,0.0967893335554335
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,256,5120,0.009361777868535783
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,256,4096,0.007947555846638149
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,256,7168,0.06834489107131958
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,256,6144,0.059635553095075816
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,256,3584,0.0075902218619982404
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,512,1024,0.004554666578769684
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,256,3072,0.006924444602595435
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,256,5120,0.04892711175812615
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,256,2560,0.006230222268237009
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,256,4096,0.03968977928161621
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,256,2048,0.0053182223604785065
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,256,1536,0.004878222114510006
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,256,3584,0.035903112755881414
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,256,3072,0.03196977906756931
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,256,2560,0.02810133496920268
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,256,768,0.003896000070704354
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,256,2048,0.02474400069978502
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,256,1536,0.021143999364640977
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,256,512,0.0038204445607132385
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,256,256,0.0032248888164758682
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,256,1024,0.017803554733594257
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,512,64,0.01239377756913503
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,256,768,0.015475556254386902
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,256,512,0.01383733335468504
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,256,64,0.002875555513633622
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,256,256,0.01240533341964086
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,256,128,0.011724444727102915
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,128,65536,0.036335110664367676
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,256,64,0.011681777735551199
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,256,32,0.011704000333944956
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,128,51200,0.02921066681543986
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,128,16384,0.012524444195959302
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,256,8192,0.07746489180458917
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,128,51200,0.4955582088894314
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,128,16384,0.16452356179555258
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,128,12288,0.011345778074529437
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,128,65536,0.6313466495937771
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,128,10240,0.010377777947319878
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,256,1024,0.004187555362780889
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,128,12288,0.11975377135806614
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,128,10240,0.09664711025026108
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,128,7168,0.008978666530715095
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,256,128,0.0031946665710873077
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,128,6144,0.009306666751702627
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,128,8192,0.07739200194676717
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,128,5120,0.009025777379671732
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,256,32,0.0031795555518733132
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,128,4096,0.007651555869314406
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,128,3584,0.007096889118353526
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,128,6144,0.05851466788185967
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,128,3072,0.006527110934257507
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,128,5120,0.04890399840142992
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,128,4096,0.03970400161213345
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,128,2560,0.0058906666106647914
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,128,2048,0.005227555417352253
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,128,3584,0.035727110173967146
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,128,1536,0.004557333472702238
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,128,3072,0.03167288833194309
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,128,1024,0.003906666818592283
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,128,768,0.0038853333228164246
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,128,2048,0.024757333927684363
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,128,512,0.0035217776894569397
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,128,1024,0.017621333400408428
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,128,768,0.015560888581805758
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,128,256,0.0032266666077905228
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,128,512,0.013778666655222574
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,128,128,0.002983111060327954
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,128,64,0.00282577777074443
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,128,256,0.012445333103338877
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,128,32,0.0028408887899584244
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,128,128,0.011709333293967776
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,128,64,0.011937778029176923
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,64,65536,0.033744888173209295
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,128,8192,0.00980711148844825
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,128,32,0.011753777662913004
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,64,16384,0.012080888781282636
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,64,16384,0.1634942160712348
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,128,7168,0.06881688700781928
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,64,12288,0.010409778190983666
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,64,10240,0.009735110733244155
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,64,51200,0.49538665347629124
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,64,8192,0.008973333570692275
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,128,2560,0.028268443213568792
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,64,12288,0.11884978082444932
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,64,7168,0.008316444853941599
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,128,1536,0.021037333541446265
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,64,6144,0.008963555925422246
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,64,8192,0.07685599724451701
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,64,5120,0.00832622249921163
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,64,7168,0.06839555501937866
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,64,6144,0.05882844660017225
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,64,5120,0.04890133274926079
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,64,4096,0.039136889908048846
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,64,3072,0.006284444282452266
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,64,3584,0.03525688913133409
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,64,51200,0.027639110883076985
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,64,2560,0.005873777800136142
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,64,2048,0.00526311124364535
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,64,3072,0.03161155515246921
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,64,1536,0.004518222063779831
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,64,2560,0.02809777855873108
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,64,1024,0.0038862224254343244
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,64,2048,0.024774221910370722
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,64,768,0.0038382220599386427
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,64,1536,0.020650666620996263
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,64,512,0.003173333282272021
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,64,1024,0.017518222332000732
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,64,256,0.0031617778456873367
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,64,768,0.015454222758611044
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,64,65536,0.6301564640469021
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,64,128,0.0028417776856157514
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,64,512,0.013589333328935834
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,64,64,0.002826666666401757
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,64,32,0.0028204443968004654
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,64,256,0.012065778175989786
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,64,10240,0.09691466887791951
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,32,65536,0.03229866756333245
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,64,128,0.012055111428101858
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,64,64,0.011714666253990598
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,64,32,0.011417778001891242
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,32,12288,0.012771555946932899
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,64,4096,0.007610666255156199
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,32,10240,0.01106844428512785
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,64,3584,0.007106666763623555
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,32,8192,0.010677333507272931
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,32,16384,0.16378133826785618
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,32,12288,0.11922666761610244
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,32,7168,0.010030222435792288
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,32,10240,0.09642133447859023
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,32,6144,0.01016266644001007
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,32,5120,0.009312888814343346
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,32,51200,0.49582931730482316
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,32,8192,0.07699111435148451
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,32,7168,0.06774399677912395
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,32,65536,0.63010221057468
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,32,3584,0.0069208890199661255
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,32,6144,0.05879555808173286
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,32,5120,0.04787288771735298
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,32,3072,0.006617777877383762
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,32,2560,0.005893333504597346
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,32,4096,0.03910577628347609
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,32,2048,0.00507377791735861
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,32,3072,0.03155466583040025
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,32,2560,0.028107557031843398
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,32,1536,0.004571555389298333
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,32,1024,0.0038453332251972626
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,32,1536,0.02085866696304745
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,32,768,0.0035457776652442086
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,32,1024,0.01719911065366533
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,32,512,0.003228444399105178
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,32,16384,0.0101742222905159
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,32,256,0.0031475555151700974
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,32,768,0.015446222490734525
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,32,128,0.0028159999185138275
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,32,256,0.012441777520709567
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,32,64,0.00282577777074443
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,32,128,0.011762667033407422
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,32,32,0.002528000002106031
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,32,64,0.011773332953453064
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,32,4096,0.007599111232492659
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,32,32,0.011724444727102915
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,32,3584,0.03496888942188687
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,32,2048,0.024825778272416856
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1281,32,51200,0.026565333207448322
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1281,32,512,0.013577777478430005
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,65536,16384,1.5317243999905055
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,65536,12288,1.1228969362046983
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,65536,16384,1.8910880618625219
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,65536,12288,1.3665893342759874
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,65536,16384,1.7068426344129775
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,65536,10240,1.1035938262939453
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,65536,10240,0.9508363935682508
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,65536,51200,4.831900278727214
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,65536,12288,1.2205493715074327
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,65536,8192,0.7868835661146375
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,65536,8192,0.8653333452012805
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,65536,7168,0.7002915806240506
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,65536,10240,0.9718248579237195
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,65536,7168,0.810191101498074
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,65536,6144,0.5292328728569878
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,65536,5120,0.4448426564534505
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,65536,5120,0.5699271096123589
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,65536,51200,6.621859656439887
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,65536,8192,0.8099377950032552
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,65536,6144,0.6544062296549479
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,65536,7168,0.7048320240444608
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,65536,6144,0.6014862060546875
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,65536,3584,0.3079377810160319
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,65536,4096,0.3571431106991238
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,65536,4096,0.44063199890984434
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,65536,3584,0.4024666680230035
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,65536,3072,0.2664408948686388
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,65536,2560,0.25893955760531956
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,65536,5120,0.5052968660990397
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,65536,3072,0.3398328887091742
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,65536,4096,0.415699561436971
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,65536,2048,0.18984711170196533
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,65536,3584,0.370344877243042
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,65536,2560,0.29013244311014813
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,65536,3072,0.3202213446299235
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,65536,1536,0.1388346619076199
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,65536,1024,0.1097831130027771
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,65536,2048,0.23438933160569933
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,65536,1536,0.18765510453118217
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,65536,2560,0.27547023031446666
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,65536,768,0.07698488897747464
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,65536,2048,0.230621337890625
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,65536,1536,0.18529066774580213
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,65536,512,0.058394663863711886
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,65536,1024,0.14374755488501653
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,65536,256,0.04376711116896736
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,65536,1024,0.14778844515482584
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,65536,768,0.1131226619084676
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,65536,768,0.12231555249955918
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,65536,128,0.03923377725813124
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,65536,512,0.09829955630832249
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,65536,512,0.10172533326678806
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,65536,64,0.03614577651023865
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,65536,256,0.08221599790785047
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,65536,256,0.09028533432218765
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,65536,128,0.06732889016469319
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,65536,128,0.0829555524720086
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,65536,64,0.08250844478607178
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,65536,32,0.08278489112854004
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,65536,32,0.036525332265430026
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,51200,16384,1.1952169206407335
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,65536,51200,5.4733022054036455
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,51200,51200,3.7417822943793406
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,51200,16384,1.5006986194186742
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,51200,12288,0.9144212934705945
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,51200,65536,4.8728718227810335
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,51200,12288,1.0582479900783963
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,51200,51200,5.110416836208768
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,51200,10240,0.8276044527689616
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,51200,10240,0.8930408689710828
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,51200,16384,1.321772469414605
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,51200,65536,7.014613257514106
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,51200,12288,0.9711653391520182
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,51200,8192,0.5905884636773003
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,51200,8192,0.7162115308973523
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,51200,7168,0.47875197728474933
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,51200,7168,0.6309599876403809
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,51200,10240,0.799624866909451
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,51200,6144,0.446074644724528
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,51200,8192,0.644421312544081
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,51200,5120,0.38648711310492617
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,51200,6144,0.5208595593770345
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,51200,7168,0.5723244349161783
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,51200,51200,4.350642734103732
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,51200,4096,0.2799786726633708
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,51200,6144,0.4894595675998264
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,51200,3584,0.24532710181342232
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,51200,5120,0.4505822393629286
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,51200,4096,0.36504356066385907
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,51200,3072,0.23584445317586264
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,51200,3584,0.31434843275282115
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,51200,3072,0.266536898083157
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,51200,2560,0.21106221940782335
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,51200,4096,0.3490275541941325
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,51200,5120,0.41184266408284503
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,51200,2048,0.1552799940109253
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,51200,3072,0.26310933960808647
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,51200,1536,0.11917955345577663
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,51200,2048,0.1886284483803643
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,51200,2560,0.2272497812906901
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,51200,2560,0.2427519957224528
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,51200,1024,0.08493955267800225
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,51200,1536,0.15285332997639975
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,51200,2048,0.18986577457851836
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,51200,768,0.0646666685740153
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,51200,512,0.050139556328455605
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,51200,1024,0.11493155691358779
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,51200,1536,0.16036532984839544
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,51200,1024,0.12675466802385119
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,51200,256,0.0369484457704756
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,51200,768,0.09267999728520711
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,51200,128,0.03087644444571601
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,51200,512,0.08581688668992783
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,51200,512,0.07965777979956733
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,51200,256,0.07327200306786431
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,51200,256,0.07307377788755628
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,51200,32,0.026428444517983332
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,51200,128,0.057486222849951855
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,51200,64,0.0675635536511739
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,51200,32,0.06783377461963229
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,51200,3584,0.3071520063612196
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,51200,65536,5.696567111545139
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,51200,768,0.10179199775060017
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,51200,64,0.02611555490228865
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,51200,128,0.06834666596518622
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,16384,51200,1.2102852927313912
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,16384,65536,1.6194995244344075
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,16384,16384,0.40955021646287704
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,16384,12288,0.3110151025984022
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,16384,16384,0.5602622032165527
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,16384,12288,0.4433564345041911
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,16384,10240,0.2602391242980957
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,16384,51200,1.9374249776204426
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,16384,65536,2.353417714436849
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,16384,10240,0.3404826588100857
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,16384,8192,0.2194746732711792
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,16384,16384,0.5676222377353245
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,16384,12288,0.4414515495300293
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,16384,7168,0.19396444161732992
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,16384,8192,0.2661840120951335
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,16384,10240,0.3571191098954942
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,16384,6144,0.16109332773420545
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,16384,8192,0.28585423363579643
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,16384,7168,0.23599910736083984
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,16384,5120,0.1425795555114746
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,16384,6144,0.20175466272566053
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,16384,7168,0.25446311632792157
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,16384,6144,0.22079377704196504
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,16384,4096,0.10744711425569321
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,16384,5120,0.1723866727617052
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,16384,3584,0.09823911057578193
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,16384,5120,0.18887466854519316
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,16384,4096,0.1400408877266778
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,16384,3072,0.085825781027476
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,16384,4096,0.15755555364820692
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,16384,3584,0.14227022065056696
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,16384,2560,0.07541777690251668
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,16384,3072,0.10951911078559028
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,16384,3072,0.12545066409640843
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,16384,2048,0.06037155787150065
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,16384,3584,0.1279546684688992
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,16384,2560,0.09472444322374131
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,16384,1536,0.04495555493566725
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,16384,2560,0.11003110806147258
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,16384,1024,0.032390223609076604
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,16384,2048,0.0797884464263916
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,16384,2048,0.09450844261381362
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,16384,51200,1.779327180650499
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,16384,1536,0.0781902207268609
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,16384,768,0.025613332788149517
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,16384,1536,0.06474133332570393
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,16384,512,0.018442667192882962
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,16384,1024,0.04921333326233757
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,16384,1024,0.06586844391292997
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,16384,65536,2.3142142825656467
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,16384,256,0.014762666490342883
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,16384,768,0.05539555682076348
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,16384,128,0.011585777832402123
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,16384,768,0.0447671115398407
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,16384,512,0.04718666606479221
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,16384,512,0.03359555535846286
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,16384,64,0.010669333239396414
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,16384,32,0.010219555762079027
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,16384,128,0.033831109603246055
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,16384,128,0.02847911251915826
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,16384,64,0.028466665082507666
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,16384,32,0.029112001260121662
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,12288,51200,1.0739680396185982
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,12288,65536,1.216618643866645
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,16384,256,0.02975644336806403
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,16384,256,0.04424444503254361
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,12288,16384,0.3296062151590983
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,12288,51200,1.4919172922770183
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,12288,16384,0.4527511066860623
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,12288,12288,0.23959199587504068
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,12288,65536,1.9787110222710504
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,12288,10240,0.20992088317871094
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,12288,16384,0.4897431267632379
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,12288,8192,0.1895324389139811
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,12288,10240,0.2756248844994439
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,12288,12288,0.36605511771308047
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,12288,7168,0.14073422220018175
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,12288,8192,0.24554488393995497
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,12288,10240,0.31040623452928334
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,12288,7168,0.19005421797434488
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,12288,8192,0.24791023466322157
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,12288,6144,0.13968888918558756
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,12288,5120,0.11218489540947808
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,12288,7168,0.22053333123524985
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,12288,6144,0.16811554961734346
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,12288,6144,0.19145333766937256
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,12288,5120,0.14781067106458876
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,12288,4096,0.08094933297899035
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,12288,3584,0.08068533076180352
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,12288,5120,0.16423111491733128
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,12288,65536,1.9710364871554906
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,12288,12288,0.32878756523132324
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,12288,4096,0.11599822839101155
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,12288,3072,0.06884533166885376
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,12288,4096,0.13819111718071833
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,12288,2560,0.05839733282725016
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,12288,3584,0.10287200080023871
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,12288,3584,0.12571911017100015
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,12288,2048,0.0447377794318729
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,12288,1536,0.03603466682963901
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,12288,3072,0.09356266922420925
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,12288,3072,0.11026933458116318
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,12288,2560,0.07872355646557279
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,12288,2048,0.06681866778267755
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,12288,2048,0.08405955632527669
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,12288,51200,1.523787604437934
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,12288,768,0.021282666259341772
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,12288,1536,0.07106400198406644
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,12288,1024,0.0410755541589525
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,12288,512,0.018201778332392376
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,12288,1024,0.05756711297565036
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,12288,256,0.014541332920392355
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,12288,768,0.05023022161589729
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,12288,768,0.03431288732422723
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,12288,512,0.043656001488367714
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,12288,128,0.012568888564904531
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,12288,256,0.036588443650139704
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,12288,64,0.011712888876597086
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,12288,128,0.02450399928622776
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,12288,32,0.012133333418104382
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,12288,64,0.024002666274706524
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,12288,32,0.02405599918630388
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,12288,2560,0.09682399696773952
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,12288,1024,0.024711110525661047
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,12288,1536,0.051989333497153394
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,12288,512,0.02846577763557434
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,10240,65536,1.0180560217963326
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,12288,256,0.024898666474554274
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,12288,128,0.031537777847713895
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,10240,51200,0.6971706814236112
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,10240,16384,0.2774604426489936
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,10240,12288,0.1880720059076945
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,10240,16384,0.40172799428304035
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,10240,10240,0.1469448937310113
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,10240,12288,0.3182595570882161
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,10240,65536,1.690707524617513
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,10240,16384,0.4529511133829753
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,10240,51200,1.3015644285413954
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,10240,8192,0.1294364399380154
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,10240,10240,0.2409422132703993
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,10240,7168,0.10451466507381862
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,10240,8192,0.19219822353786895
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,10240,12288,0.3461137877570258
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,10240,10240,0.285753779941135
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,10240,6144,0.10569333367877537
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,10240,7168,0.17010933823055693
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,10240,5120,0.08211733235253228
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,10240,7168,0.20696889029608834
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,10240,6144,0.14840800232357448
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,10240,6144,0.17939378155602348
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,10240,4096,0.07187644640604655
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,10240,5120,0.12607822153303358
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,10240,5120,0.15290844440460205
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,10240,3584,0.05853955613242256
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,10240,4096,0.10469688971837361
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,10240,4096,0.12839555740356445
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,10240,3072,0.054096887509028115
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,10240,3584,0.09248533513810898
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,10240,3584,0.11575822035471599
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,10240,51200,1.3798133002387152
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,10240,2560,0.04609510964817471
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,10240,3072,0.08240622282028198
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,10240,3072,0.10329244534174602
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,10240,2048,0.03710755705833435
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,10240,1536,0.026014222039116755
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,10240,65536,1.766048855251736
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,10240,2560,0.09072977966732448
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,10240,2048,0.058965331978268094
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,10240,1024,0.01869155632125007
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,10240,1536,0.046719110674328275
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,10240,1536,0.06653066476186116
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,10240,768,0.015770667129092746
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,10240,8192,0.2287964555952284
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,10240,1024,0.037520888778898455
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,10240,512,0.014089778065681458
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,10240,768,0.031002667215135362
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,10240,768,0.046606222788492836
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,10240,256,0.010405333505736457
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,10240,512,0.025753777888086107
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,10240,512,0.04081244601143731
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,10240,128,0.009312888814343346
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,10240,256,0.035192890299691096
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,10240,256,0.023014222582181294
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,10240,64,0.008900444540712569
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,10240,128,0.028831998507181805
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,10240,32,0.00885333369175593
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,10240,128,0.022052443689770166
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,10240,64,0.021990221407678392
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,10240,32,0.02167111138502757
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,10240,2560,0.07086400190989177
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,10240,2048,0.0779786639743381
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,10240,1024,0.054423110352622144
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,8192,65536,0.7704062461853027
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,8192,51200,0.6511617766486274
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,8192,16384,0.23935466342502168
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,8192,12288,0.18035377396477592
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,8192,16384,0.37047555711534286
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,8192,65536,1.4494329028659398
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,8192,16384,0.43145065837436253
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,8192,12288,0.28853511810302734
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,8192,10240,0.1412257750829061
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,8192,51200,1.139287100897895
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,8192,8192,0.11160800192091201
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,8192,10240,0.21255644162495932
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,8192,8192,0.16915644539727104
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,8192,7168,0.11160355144076878
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,8192,10240,0.26566844516330296
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,8192,6144,0.09336266915003459
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,8192,8192,0.21779021951887342
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,8192,7168,0.14932178126441106
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,8192,7168,0.1875751150978936
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,8192,5120,0.07500355773501925
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,8192,6144,0.1307742198308309
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,8192,51200,1.2605999840630424
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,8192,4096,0.05628177854749891
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,8192,6144,0.1633840004603068
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,8192,65536,1.6113502714369032
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,8192,3584,0.04978044496642219
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,8192,5120,0.11059644487169053
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,8192,5120,0.1400159994761149
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,8192,4096,0.0917137795024448
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,8192,3072,0.044180442889531456
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,8192,4096,0.11812622017330593
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,8192,3584,0.0827360020743476
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,8192,2560,0.03874222106403775
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,8192,3584,0.10607200198703343
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,8192,2048,0.03255911005867852
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,8192,3072,0.07358577516343859
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,8192,1536,0.024919999970330134
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,8192,2560,0.06231377522150675
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,8192,2560,0.08361422353320652
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,8192,2048,0.05199999941719902
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,8192,1024,0.017729777428838942
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,8192,2048,0.0735351112153795
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,8192,12288,0.3120453357696533
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,8192,768,0.014287999934620328
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,8192,1536,0.04202488727039761
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,8192,1536,0.060657779375712075
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,8192,512,0.011391110718250275
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,8192,256,0.008732444710201686
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,8192,1024,0.050556444459491305
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,8192,1024,0.0336773329310947
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,8192,768,0.04407199886110094
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,8192,768,0.027503111296229895
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,8192,128,0.0073831114504072405
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,8192,512,0.02336799932850732
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,8192,64,0.008290666672918532
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,8192,256,0.03206133180194431
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,8192,32,0.00867911097076204
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,8192,128,0.020283554991086323
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,8192,64,0.01995022263791826
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,8192,32,0.019664888580640156
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,7168,65536,0.61135286755032
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,8192,3072,0.0952026645342509
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,8192,512,0.03763644562827216
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,8192,256,0.020621332857343886
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,7168,51200,0.5264933374192979
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,8192,128,0.0273671117093828
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,7168,16384,0.16953599452972412
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,7168,65536,1.3333359824286566
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,7168,12288,0.11465333567725287
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,7168,16384,0.37272267871432835
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,7168,51200,1.0502150853474934
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,7168,12288,0.23820355203416613
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,7168,16384,0.3815600077311198
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,7168,10240,0.10939911339018081
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,7168,8192,0.09689866834216648
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,7168,12288,0.28415200445387095
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,7168,10240,0.195269332991706
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,7168,7168,0.08294666475719877
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,7168,8192,0.15921955638461643
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,7168,10240,0.2373164494832357
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,7168,6144,0.06332888868119982
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,7168,8192,0.19356444146898058
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,7168,7168,0.13813511530558267
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,7168,65536,1.465725368923611
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,7168,7168,0.17201244831085205
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,7168,6144,0.120943996641371
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,7168,4096,0.04889600144492256
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,7168,6144,0.1505733331044515
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,7168,3584,0.04346399837070041
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,7168,5120,0.10261599885092841
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,7168,5120,0.12977777587042913
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,7168,4096,0.10945866505304973
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,7168,4096,0.08549066384633382
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,7168,51200,1.1535636054144967
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,7168,3584,0.07508889171812269
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,7168,3584,0.0984755555788676
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,7168,2560,0.03300889001952277
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,7168,3072,0.08789955245123969
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,7168,3072,0.06778222322463989
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,7168,2048,0.027107555005285475
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,7168,1536,0.02054755555258857
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,7168,2560,0.07721955246395536
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,7168,2560,0.05834666887919108
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,7168,1024,0.015308444698651632
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,7168,2048,0.0495777792400784
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,7168,2048,0.06770044565200806
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,7168,768,0.012161778079138862
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,7168,1536,0.039800001515282526
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,7168,1024,0.04771022333039177
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,7168,1024,0.031889776388804116
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,7168,512,0.009694221946928237
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,7168,768,0.026183999247021143
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,7168,768,0.041555556986067034
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,7168,256,0.007321777443091075
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,7168,512,0.03432800041304694
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,7168,512,0.02200177808602651
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,7168,128,0.007152888509962294
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,7168,256,0.031405333015653826
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,7168,256,0.01974933346112569
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,7168,5120,0.06035821967654758
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,7168,64,0.006234666539563074
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,7168,32,0.006414222220579783
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,7168,128,0.019208888212839764
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,7168,64,0.01897333396805657
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,7168,32,0.018599111172888014
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,7168,3072,0.03698044353061252
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,6144,65536,0.5530248747931586
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,6144,51200,0.5366835594177246
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,7168,1536,0.05685955286026001
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,6144,16384,0.3360133435991075
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,6144,51200,0.9693386289808484
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,7168,128,0.02740266587999132
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,6144,12288,0.1276871098412408
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,6144,65536,1.242744869656033
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,6144,16384,0.3787555429670546
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,6144,10240,0.11387288570404053
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,6144,12288,0.21980178356170654
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,6144,8192,0.09108977847629124
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,6144,10240,0.18043911457061768
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,6144,12288,0.2810320059458415
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,6144,10240,0.23511200480990938
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,6144,8192,0.14489155345492893
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,6144,51200,1.1377323998345268
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,6144,6144,0.061568001906077065
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,6144,8192,0.20382222864362928
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,6144,7168,0.128257777955797
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,6144,16384,0.15838400522867838
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,6144,5120,0.05620977613661024
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,6144,7168,0.1701893276638455
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,6144,4096,0.04452711012628344
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,6144,6144,0.11158133877648248
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,6144,6144,0.14863022168477377
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,6144,65536,1.455567995707194
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,6144,5120,0.09575288825564915
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,6144,4096,0.0792799989382426
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,6144,3584,0.0380657778845893
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,6144,5120,0.12857066260443792
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,6144,3072,0.03462310963206821
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,6144,4096,0.10802844497892593
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,6144,2560,0.029567999972237483
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,6144,3584,0.09798755248387654
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,6144,3584,0.07031822204589844
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,6144,3072,0.08673599693510269
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,6144,3072,0.05977244509590996
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,6144,2048,0.02550044490231408
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,6144,2560,0.07663644684685601
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,6144,2560,0.05344533258014255
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,6144,1024,0.015435554915004306
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,6144,2048,0.06726221905814277
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,6144,2048,0.04485333296987745
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,6144,1536,0.0367253323396047
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,6144,768,0.012702222499582501
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,6144,1536,0.056120885743035205
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,6144,512,0.009993777506881291
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,6144,1024,0.04679200053215027
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,6144,1024,0.029061334000693426
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,6144,256,0.007607111500369177
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,6144,768,0.024344000551435683
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,6144,7168,0.0771813326411777
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,6144,128,0.006573333508438534
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,6144,512,0.020647999313142564
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,6144,256,0.02974489000108507
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,6144,256,0.01860000027550591
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,6144,64,0.006628444625271692
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,6144,32,0.006606222026877933
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,6144,128,0.026102221674389307
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,6144,128,0.018248889181349013
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,6144,64,0.01793066660563151
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,6144,32,0.01758044461409251
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,5120,65536,0.4882515801323785
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,5120,51200,0.40781688690185547
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,6144,1536,0.01976088848378923
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,5120,16384,0.13599644766913518
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,6144,768,0.0391591125064426
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,6144,512,0.03441333439615037
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,5120,16384,0.27542932828267414
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,5120,65536,1.1312987009684246
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,5120,12288,0.10524355702930027
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,5120,10240,0.0768231087260776
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,5120,16384,0.3433982266320123
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,5120,12288,0.20203910933600533
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,5120,8192,0.0695377786954244
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,5120,12288,0.2545626693301731
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,5120,10240,0.1649457746081882
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,5120,7168,0.06331821944978502
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,5120,10240,0.2135066721174452
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,5120,8192,0.13292800055609807
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,5120,8192,0.17422844303978813
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,5120,7168,0.117594665951199
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,5120,65536,1.3154417673746746
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,5120,5120,0.046903110212749906
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,5120,7168,0.15464622444576687
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,5120,4096,0.038174221913019814
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,5120,6144,0.10346311330795288
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,5120,51200,1.03676266140408
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,5120,6144,0.13613243897755942
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,5120,5120,0.08864711390601264
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,5120,5120,0.11771199438307021
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,5120,3072,0.028182221783532038
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,5120,4096,0.07329422235488892
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,5120,4096,0.09927822483910455
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,5120,3584,0.06520089175966051
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,5120,3584,0.0896035565270318
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,5120,2560,0.024336000283559162
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,5120,2048,0.020224000016848247
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,5120,3072,0.05541422300868564
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,5120,3072,0.07954488860236274
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,5120,1536,0.01608711149957445
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,5120,2560,0.07058133019341363
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,5120,2560,0.04827555682924059
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,5120,1024,0.012440000143316058
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,5120,2048,0.041542222102483116
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,5120,51200,0.9017893473307291
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,5120,1536,0.051184889343049794
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,5120,1536,0.03381244341532389
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,5120,768,0.0103511114915212
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,5120,512,0.007967111137178209
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,5120,1024,0.04183822207980686
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,5120,768,0.02251200046804216
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,5120,256,0.006592000110281839
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,5120,512,0.01959911154376136
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,5120,512,0.03256888853179084
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,5120,128,0.006075555665625467
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,5120,256,0.029840889904234145
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,5120,128,0.017238222890430026
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,5120,64,0.0052391112678580815
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,5120,128,0.025920000341203477
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,5120,32,0.005836444596449534
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,5120,3584,0.03156444430351257
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,5120,64,0.017177777157889474
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,5120,32,0.016866667403115165
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,5120,2048,0.06213866339789497
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,4096,65536,0.46964179144965273
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,5120,1024,0.02711822258101569
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,5120,768,0.03703377644220988
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,4096,51200,0.38622223006354434
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,5120,6144,0.05471822288301256
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,4096,16384,0.12404266993204753
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,4096,65536,1.0187181896633573
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,4096,12288,0.09818222125371297
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,4096,51200,0.7958578003777398
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,4096,16384,0.34610488679673934
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,4096,12288,0.1833040051990085
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,4096,10240,0.07577866978115506
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,4096,12288,0.2533342308468289
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,4096,10240,0.15148533715142146
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,4096,8192,0.05968622366587321
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,4096,10240,0.2126613325542874
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,4096,51200,1.0219155417548287
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,4096,7168,0.0520924429098765
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,4096,8192,0.12200178040398492
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,5120,256,0.01755822201569875
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,4096,65536,1.3006533516777885
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,4096,8192,0.1724231110678779
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,4096,6144,0.04246755441029867
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,4096,5120,0.03761333227157593
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,4096,7168,0.15467111269632974
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,4096,7168,0.108660446272956
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,4096,6144,0.09511288669374253
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,4096,5120,0.08145955536100599
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,4096,5120,0.1166986624399821
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,4096,16384,0.25155822436014813
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,4096,3584,0.02589955594804552
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,4096,4096,0.06636089086532593
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,4096,3072,0.022745778163274128
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,4096,4096,0.09794755776723225
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,4096,2560,0.020961778031455144
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,4096,3584,0.08888889021343654
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,4096,3584,0.05893955628077189
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,4096,3072,0.07866755459043714
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,4096,3072,0.051539556847678296
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,4096,1536,0.01309333327743742
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,4096,2560,0.04435377650790744
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,4096,2560,0.06983644432491727
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,4096,2048,0.03872355487611558
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,4096,2048,0.061262223455641
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,4096,1024,0.009926222264766693
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,4096,768,0.008746667040718926
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,4096,1536,0.04987466666433546
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,4096,1536,0.03092799915207757
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,4096,512,0.006978666616810693
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,4096,1024,0.04315200116899279
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,4096,768,0.02106933295726776
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,4096,768,0.03637955586115519
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,4096,256,0.006233777850866318
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,4096,512,0.032179554303487144
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,4096,512,0.018215111560291715
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,4096,128,0.00556355549229516
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,4096,256,0.02882044514020284
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,4096,64,0.005277333160241445
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,4096,128,0.016166221764352586
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,4096,32,0.005227555417352253
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,4096,4096,0.030458665556377832
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,4096,64,0.015848888291252982
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,4096,32,0.015525332755512662
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,3584,65536,0.3515377839406331
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,3584,51200,0.2581617832183838
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,4096,1024,0.024757333927684363
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,4096,256,0.016505777835845947
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,3584,65536,0.9600622389051648
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,4096,128,0.02504088812404209
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,3584,16384,0.09943644205729167
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,4096,6144,0.13510666953192815
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,3584,12288,0.07263021998935275
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,3584,16384,0.23982487784491646
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,3584,10240,0.05708444118499756
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,3584,51200,0.7833991050720215
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,3584,12288,0.17497600449456108
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,3584,16384,0.3078542285495334
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,3584,12288,0.2271662288241916
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,4096,2048,0.017606221967273288
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,3584,8192,0.04803911182615492
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,3584,65536,1.1691172917683919
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,3584,7168,0.04377955529424879
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,3584,10240,0.14375110467274985
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,3584,6144,0.03672711054484049
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,3584,8192,0.11663644843631321
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,3584,10240,0.1940551069047716
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,3584,8192,0.15516800350613064
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,3584,5120,0.030954665607876245
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,3584,7168,0.13895821571350098
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,3584,4096,0.02544622288809882
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,3584,51200,0.917825804816352
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,3584,6144,0.12242133087582058
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,3584,6144,0.09059644407696194
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,3584,3584,0.023690667417314317
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,3584,5120,0.1054275565677219
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,3584,3072,0.019903111788961623
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,3584,4096,0.08926666445202297
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,3584,4096,0.06311555703481038
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,3584,3584,0.08132711384031507
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,3584,2560,0.017607111069891188
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,3584,3584,0.05551200111707052
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,3584,3072,0.07233688566419813
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,3584,2048,0.015142222245534262
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,3584,3072,0.04929688904020521
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,3584,1536,0.012755555411179861
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,3584,2560,0.06387377447552152
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,3584,2560,0.04249866803487142
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,3584,2048,0.05674666828579373
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,3584,1024,0.009524444739023844
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,3584,2048,0.03692355420854356
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,3584,768,0.00798044436507755
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,3584,1536,0.02997866604063246
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,3584,1536,0.04692088895373874
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,3584,1024,0.038784000608656145
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,3584,1024,0.023952000670962866
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,3584,768,0.03432800041304694
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,3584,768,0.020614221692085266
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,3584,256,0.005541333307822545
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,3584,512,0.03047200043996175
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,3584,512,0.017847999930381775
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,3584,128,0.004879111217127906
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,3584,256,0.027433777848879497
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,3584,64,0.00424888895617591
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,3584,128,0.024345777100986902
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,3584,32,0.004513777792453766
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,3584,7168,0.10372177759806316
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,3584,64,0.015444444285498725
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,3584,32,0.015104888214005364
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,3584,5120,0.07822489076190524
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,3072,65536,0.3004773457845052
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,3072,51200,0.2616808944278293
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,3584,512,0.0069715554515520734
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,3072,16384,0.09038399987750584
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,3072,65536,0.9160399966769748
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,3584,256,0.016403555870056152
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,3072,51200,0.7118613455030652
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,3584,128,0.01551466683546702
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,3072,12288,0.06788622008429633
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,3072,16384,0.2242622110578749
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,3072,10240,0.05769333574506971
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,3072,12288,0.1675137811236911
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,3072,16384,0.3059075673421224
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,3072,10240,0.13800266053941515
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,3072,12288,0.22738756073845756
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,3072,8192,0.04281511240535312
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,3072,10240,0.18984711170196533
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,3072,7168,0.0402471125125885
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,3072,65536,1.1670257780287001
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,3072,51200,0.9197538163926867
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,3072,8192,0.11105777819951375
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,3072,7168,0.09883111053042942
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,3072,8192,0.155057774649726
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,3072,7168,0.13852889007992214
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,3072,5120,0.02942488922013177
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,3072,4096,0.025013332565625507
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,3072,6144,0.08650577730602688
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,3072,6144,0.12168178293440078
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,3072,5120,0.07379021909501818
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,3072,3584,0.021942221456103857
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,3072,4096,0.059803558720482715
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,3072,3072,0.01978488928741879
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,3072,4096,0.08901421891318427
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,3072,2560,0.017690666847758822
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,3072,3584,0.05300266544024149
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,3072,3584,0.08074222008387248
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,3072,3072,0.04659644431538052
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,3072,3072,0.0720391141043769
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,3072,2048,0.01498044364982181
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,3072,1536,0.01242844429281023
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,3072,2560,0.0406622224383884
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,3072,2560,0.06367288695441352
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,3072,2048,0.056333336565229625
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,3072,2048,0.034952001439200506
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,3072,1024,0.00960177762640847
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,3072,768,0.008279999925030602
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,3072,1536,0.045824001232783
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,3072,1536,0.029117332564459905
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,3072,512,0.0069271110826068455
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,3072,1024,0.03873599900139703
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,3072,1024,0.022679110368092854
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,3072,768,0.0342497792508867
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,3072,768,0.019627556204795837
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,3072,256,0.006162666612201267
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,3072,128,0.004886222382386525
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,3072,512,0.01717866626050737
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,3072,512,0.030136889881557886
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,3072,64,0.00490133340160052
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,3072,256,0.027404444085227117
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,3072,256,0.015536889433860779
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,3072,6144,0.03484355409940084
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,3072,32,0.005564444594913059
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,3072,128,0.015164444843928019
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,3072,64,0.01482311056719886
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,3072,32,0.014828445182906257
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,2560,65536,0.259676456451416
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,3072,5120,0.10503555668724908
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,2560,51200,0.21754488680097792
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,2560,16384,0.07627822293175592
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,2560,16384,0.21743199560377333
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,2560,12288,0.05533688929345873
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,2560,16384,0.30495556195576984
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,2560,51200,0.6739697986178927
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,2560,65536,0.8644568655225965
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,2560,10240,0.04692177640067207
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,2560,12288,0.15955021646287706
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,2560,8192,0.0363031095928616
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,2560,12288,0.22515198919508192
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,2560,10240,0.13134933842553034
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,3072,128,0.024150222539901733
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,2560,10240,0.18869600031110975
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,2560,7168,0.03300177719857957
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,2560,6144,0.030177778667873804
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,2560,8192,0.10581244362725152
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,2560,8192,0.15405244297451443
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,2560,51200,0.9162231021457248
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,2560,65536,1.1611910925971138
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,2560,5120,0.024559999505678814
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,2560,7168,0.13751199510362414
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,2560,4096,0.020326221982638042
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,2560,6144,0.08220889170964558
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,2560,6144,0.12028888861338298
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,2560,3584,0.018041777941915724
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,2560,5120,0.06978399886025323
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,2560,5120,0.10463288757536147
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,2560,4096,0.05695644352171156
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,2560,4096,0.08801955646938747
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,2560,3072,0.01630311045381758
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,2560,2560,0.014486221803559197
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,2560,3584,0.050387554698520236
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,2560,3584,0.07995733287599352
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,2560,2048,0.012444444828563266
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,2560,3072,0.044181333647833936
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,2560,3072,0.07155822383032905
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,2560,2560,0.03844533363978068
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,2560,2560,0.06338755289713542
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,2560,2048,0.032540443870756365
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,2560,2048,0.05626577801174588
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,2560,1536,0.046422223250071205
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,2560,768,0.007307555940416124
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,2560,1024,0.0384133325682746
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,2560,1024,0.021776000658671062
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,2560,512,0.0058959999846087555
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,2560,768,0.01887022289964888
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,2560,512,0.01649777756796943
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,2560,256,0.004872888740566042
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,2560,512,0.030185778935750324
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,2560,256,0.014800889624489678
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,2560,256,0.027083555857340496
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,2560,7168,0.0936702224943373
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,2560,128,0.004547555413511065
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,2560,64,0.0041742221348815495
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,2560,128,0.01443555619981554
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,2560,128,0.0239955551094479
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,2560,32,0.004202666795916027
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,2560,64,0.014109333356221518
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,2560,32,0.014096000128322177
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,2048,65536,0.23045688205295137
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,2560,1024,0.00795199970404307
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,2560,1536,0.027306665976842243
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,2048,51200,0.157425774468316
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,2048,16384,0.0597297747929891
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,2560,768,0.034120000070995755
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,2048,65536,0.8170222176445855
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,2048,16384,0.21847111648983428
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,2048,12288,0.0444160004456838
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,2048,51200,0.6372888882954916
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,2048,16384,0.3028533458709717
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,2048,10240,0.037864890363481306
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,2048,12288,0.15431643856896296
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,2048,8192,0.02956355611483256
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,2048,12288,0.22475022739834258
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,2048,10240,0.12411022186279297
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,2048,10240,0.1879582272635566
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,2048,7168,0.02641422218746609
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,2560,1536,0.010405333505736457
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,2048,51200,0.9044666290283203
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,2048,65536,1.151733292473687
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,2048,6144,0.023403555154800415
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,2048,5120,0.020027556353145175
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,2048,7168,0.08860888746049668
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,2048,7168,0.13696889082590738
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,2048,4096,0.017490666773584154
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,2048,6144,0.07771199941635132
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,2048,6144,0.1204213301340739
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,2048,3584,0.015465777781274585
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,2048,5120,0.06621244218614367
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,2048,5120,0.1033982237180074
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,2048,3072,0.014131555954615274
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,2048,4096,0.08800711234410603
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,2048,2560,0.012302222351233164
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,2048,3584,0.04753777715894911
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,2048,3584,0.07998133367962308
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,2048,2048,0.010568000376224518
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,2048,3072,0.07093955410851373
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,2048,2560,0.036016888088650174
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,2048,2560,0.06310755676693387
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,2048,1536,0.008626666333940294
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,2048,2048,0.05568799707624647
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,2048,2048,0.03198400139808655
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,2048,1024,0.0069288888739215
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,2048,1536,0.025593777497609455
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,2048,1536,0.045215109984079994
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,2048,768,0.006124444305896759
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,2048,1024,0.021021333005693223
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,2048,1024,0.03839733203252157
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,2048,512,0.005220444252093633
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,2048,768,0.017992888887723286
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,2048,768,0.033987555238935686
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,2048,256,0.004561777744028303
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,2048,8192,0.10104799932903713
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,2048,8192,0.15309777524736193
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,2048,512,0.016171556380059984
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,2048,512,0.030512889226277668
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,2048,128,0.0038542221817705366
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,2048,64,0.004867555366622077
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,2048,256,0.01461955573823717
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,2048,256,0.026826666461096868
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,2048,32,0.00490399988161193
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,2048,128,0.02370133333735996
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,2048,128,0.014095111025704278
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,2048,64,0.013745778136783175
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,2048,32,0.01348977784315745
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,2048,4096,0.0536008874575297
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,1536,65536,0.1897137827343411
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,1536,51200,0.1346328920788235
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,1536,16384,0.050119111935297646
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,2048,3072,0.041745778587129384
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,1536,12288,0.03581600056754218
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,1536,16384,0.1958400011062622
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,1536,16384,0.26820354991488987
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,1536,12288,0.14392533567216662
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,1536,10240,0.03049600124359131
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,1536,51200,0.599872907002767
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,1536,65536,0.7673395474751791
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,1536,8192,0.025223111112912495
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,1536,12288,0.1991164419386122
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,1536,7168,0.02198133369286855
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,1536,10240,0.11737510893079971
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,1536,10240,0.17103111743927002
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,1536,8192,0.0944604476292928
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,1536,6144,0.01945955554644267
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,1536,8192,0.13618489106496176
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,1536,51200,0.7973946465386285
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,1536,5120,0.016864889197879367
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,1536,7168,0.08385777473449707
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,1536,65536,1.01400269402398
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,1536,4096,0.014408888088332282
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,1536,6144,0.10784266392389934
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,1536,6144,0.07317511240641277
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,1536,3584,0.01331822243001726
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,1536,5120,0.09201066361533271
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,1536,5120,0.06155911419126722
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,1536,3072,0.011756444142924415
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,1536,4096,0.0786328911781311
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,1536,4096,0.049944000111685864
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,1536,2560,0.010390222072601318
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,1536,3584,0.04474222328927782
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,1536,3584,0.07208977805243598
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,1536,2048,0.00884622252649731
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,1536,3072,0.06390488810009427
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,1536,1536,0.007303111255168915
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,1536,2560,0.05681155787573921
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,1536,2048,0.029603554142846003
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,1536,2048,0.05064800050523546
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,1536,1024,0.005937777873542573
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,1536,1536,0.02440266642305586
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,1536,1536,0.0411102208826277
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,1536,768,0.005592888842026393
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,1536,1024,0.020271110865804885
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,1536,512,0.004879111217127906
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,1536,768,0.017364444004164804
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,1536,768,0.031167109807332356
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,1536,256,0.004193777839342753
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,1536,512,0.015495111544926962
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,1536,512,0.028127110666698877
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,1536,128,0.00388711111413108
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,1536,256,0.013757333159446716
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,1536,256,0.02609866691960229
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,1536,64,0.003539555602603488
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,1536,7168,0.12149422698550755
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,1536,128,0.02296977738539378
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,1536,128,0.013395555317401886
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,1536,32,0.0035573335157500375
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,1536,64,0.01346666696998808
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,1024,65536,0.1359457837210761
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,1536,32,0.013085333009560903
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,1024,51200,0.10769689083099365
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,1024,16384,0.036907556984159685
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,1536,3072,0.03917422228389316
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,1536,2560,0.0344124436378479
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,1024,12288,0.026208889153268602
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,1024,16384,0.18487289216783312
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,1536,1024,0.03530044356981913
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,1024,16384,0.26696356137593585
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,1024,12288,0.13505155510372585
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,1024,65536,0.7175537745157877
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,1024,51200,0.5631555451287164
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,1024,8192,0.0184515549076928
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,1024,12288,0.19701245095994738
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,1024,10240,0.11025955279668172
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,1024,10240,0.16543022791544595
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,1024,8192,0.08859466844134861
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,1024,7168,0.016968000266287062
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,1024,51200,0.7931733131408691
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,1024,6144,0.015053333507643806
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,1024,8192,0.1351999971601698
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,1024,65536,1.0085350672403972
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,1024,5120,0.013082666529549493
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,1024,7168,0.12047466966840957
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,1024,7168,0.07853066921234131
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,1024,6144,0.10592266586091782
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,1024,4096,0.011363555159833698
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,1024,6144,0.06799377997716267
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,1024,3584,0.010384889112578498
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,1024,5120,0.057272891203562416
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,1024,5120,0.09203288952509563
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,1024,3072,0.009020444419648912
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,1024,4096,0.04623111089070638
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,1024,4096,0.07785333527459039
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,1024,3584,0.041393776734670006
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,1024,3584,0.07131555345323351
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,1024,2048,0.0074480002125104266
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,1024,3072,0.03638933433426751
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,1024,3072,0.061942219734191895
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,1024,1536,0.006585777633719974
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,1024,2560,0.03153511219554477
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,1024,2560,0.05447644326421949
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,1024,1024,0.0055440002017551
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,1024,2048,0.027687999937269423
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,1024,2048,0.04870577653249105
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,1024,768,0.004910222358173794
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,1024,1536,0.023024888502226934
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,1024,1536,0.04053689042727152
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,1024,512,0.004261333495378494
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,1024,1024,0.01923022170861562
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,1024,1024,0.03463644451565213
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,1024,10240,0.022361778550677832
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,1024,256,0.0038577777643998465
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,1024,768,0.03115644388728672
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,1024,768,0.01651822196112739
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,1024,128,0.003495111233658261
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,1024,512,0.01499111122555203
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,1024,512,0.0277528895272149
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,1024,64,0.0032097777972618737
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,1024,256,0.013474666410022311
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,1024,256,0.025007999605602686
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,1024,32,0.00349866681628757
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,1024,128,0.013057777451144325
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,1024,64,0.012720000412729053
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,768,65536,0.10043911139170329
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,1024,32,0.013079110946920184
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,768,51200,0.08318310976028442
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,768,16384,0.03211377726660834
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,1024,2560,0.008348444269763099
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,768,16384,0.17557333575354683
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,768,12288,0.023798222343126934
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,768,51200,0.5326684315999349
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,768,65536,0.6778426700168185
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,768,10240,0.02088622252146403
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,768,16384,0.2631751166449653
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,768,12288,0.1285031106736925
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,768,8192,0.017272889614105225
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,768,10240,0.10461333062913682
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,768,51200,0.7809564272562662
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,768,7168,0.016220443778567843
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,768,65536,0.994606229994032
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,768,10240,0.1635377804438273
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,768,6144,0.014316444595654806
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,768,8192,0.13313155704074436
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,1024,128,0.02230577833122677
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,768,5120,0.012262221839692859
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,768,7168,0.07469689183764987
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,768,7168,0.11939111020829941
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,768,4096,0.010441777606805166
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,768,6144,0.06464355521731906
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,768,6144,0.105131553279029
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,768,3584,0.009368889033794403
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,768,5120,0.05267644590801663
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,768,4096,0.044103112485673696
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,768,3072,0.008614222208658854
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,768,3584,0.0391244457827674
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,768,3584,0.07006222009658813
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,768,2560,0.008015111088752747
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,768,3072,0.03435644507408142
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,768,2560,0.03024622135692173
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,768,2048,0.006919999917348226
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,768,2560,0.05424977673424614
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,768,2048,0.026497777965333726
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,768,12288,0.19537422392103407
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,768,2048,0.04809955424732632
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,768,1536,0.005937777873542573
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,768,1024,0.005203555441564984
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,768,1536,0.040425777435302734
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,768,8192,0.08380977974997626
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,768,1536,0.022346667117542688
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,768,1024,0.01854933301607768
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,768,1024,0.034621334738201566
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,768,512,0.00416088890698221
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,768,768,0.016176889340082806
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,768,5120,0.09045510821872288
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,768,4096,0.07633866866429646
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,768,256,0.0038373333712418876
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,768,512,0.014499555031458536
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,768,512,0.028295109669367473
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,768,128,0.003536888708670934
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,768,256,0.025721778472264607
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,768,256,0.013415999710559845
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,768,64,0.003495111233658261
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,768,128,0.012763555679056378
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,768,128,0.021948445174429152
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,512,65536,0.07343111435572307
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,768,32,0.01276000009642707
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,768,768,0.004583111239804162
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,512,51200,0.05871555540296766
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,512,65536,0.6707493464152018
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,768,768,0.031001776456832886
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,512,16384,0.024264888630972967
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,512,16384,0.1743617720074124
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,768,32,0.0035111109415690103
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,768,3072,0.06128088633219401
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,512,12288,0.020232889387342665
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,512,51200,0.5274017651875814
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,512,10240,0.018897778458065458
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,512,12288,0.1269564496146308
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,512,16384,0.26289688216315377
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,512,12288,0.19425422615475127
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,512,8192,0.014484445254007975
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,512,10240,0.10293244653277928
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,512,7168,0.012991111311647626
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,512,10240,0.16287022166781956
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,512,8192,0.08285955588022868
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,512,8192,0.13289422459072536
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,512,6144,0.011366222467687396
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,512,7168,0.07332355446285672
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,512,7168,0.11898933516608344
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,512,5120,0.010327999790509542
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,512,6144,0.06383911106321546
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,512,6144,0.10439999898274739
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,512,4096,0.011124444504578909
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,512,5120,0.05303200085957845
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,512,5120,0.09047555261188084
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,512,3584,0.008038221961922115
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,512,4096,0.04368444283803304
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,512,4096,0.07670488622453478
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,512,3072,0.0074035558435651995
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,512,3584,0.03873777720663283
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,512,3584,0.06965066989262898
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,512,2560,0.006623999940024481
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,512,3072,0.03389066788885329
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,512,3072,0.06024089124467638
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,512,2048,0.0058346668051348785
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,512,2560,0.029839111698998347
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,512,1536,0.005220444252093633
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,512,2048,0.026106667187478807
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,512,2048,0.047601779301961265
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,512,1024,0.004528000122971005
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,512,51200,0.7794711324903699
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,512,1536,0.04016444418165419
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,512,768,0.0041884444653987885
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,512,1024,0.01824355622132619
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,512,1024,0.034308443466822304
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,512,512,0.003850666599141227
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,512,768,0.015469332536061605
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,512,512,0.014142221874660917
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,512,256,0.00350222239891688
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,512,512,0.027070222629441157
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,512,256,0.012734221915404001
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,512,256,0.024849777420361836
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,512,128,0.0032026666320032547
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,512,64,0.0028719999310043124
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,512,65536,0.9888871510823568
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,512,128,0.021439111895031396
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,512,32,0.0031840000301599503
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,768,64,0.012527111503813
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,512,64,0.012411555482281579
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,512,2560,0.05395466751522488
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,512,32,0.012061333490742577
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,256,51200,0.03732622332043118
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,512,1536,0.021988444858127173
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,256,16384,0.01534400052494473
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,512,768,0.031203554736243352
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,256,51200,0.4965830908881293
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,256,65536,0.6315920088026259
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,256,16384,0.1644702222612169
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,256,12288,0.014545778433481852
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,256,10240,0.01313066648112403
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,256,12288,0.11981777350107829
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,256,16384,0.2611253261566162
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,256,12288,0.1932506693734063
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,256,51200,0.773947556813558
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,256,10240,0.09753155708312988
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,256,8192,0.012144000165992312
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,256,7168,0.011370666325092316
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,256,65536,0.9838053385416666
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,512,128,0.012339555554919772
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,256,6144,0.010713777608341642
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,256,10240,0.16246133380466038
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,256,8192,0.1328266726599799
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,256,5120,0.009313777916961247
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,256,7168,0.06863022512859769
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,256,7168,0.11816710895962185
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,256,4096,0.007976888782448238
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,256,6144,0.10455199744966294
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,256,6144,0.059193776713477246
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,256,3584,0.007267555428875818
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,256,5120,0.049271110031339854
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,256,5120,0.09016888671451145
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,256,4096,0.040766222609413996
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,256,3072,0.006623999940024481
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,256,4096,0.07585155301623873
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,256,2560,0.006281777802440856
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,256,3584,0.06770310799280803
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,256,3072,0.060043553511301674
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,256,3072,0.03173955612712436
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,256,2048,0.005569777968857024
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,256,2560,0.028140445550282795
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,256,2560,0.05374933282534281
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,256,1536,0.004884444591071871
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,256,2048,0.025072889195548162
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,256,2048,0.04744266801410251
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,256,1024,0.004202666795916027
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,256,1536,0.04008977942996555
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,256,1536,0.020928000410397846
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,256,768,0.003960000144110786
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,256,1024,0.034224887688954674
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,256,1024,0.017608000172509086
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,256,512,0.0038417776425679526
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,256,768,0.015465777781274585
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,256,768,0.030861334668265447
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,256,256,0.0032142222755485107
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,256,512,0.027076444692081873
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,256,512,0.013773333695199756
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,256,128,0.00286311118139161
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,256,8192,0.07765599754121569
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,256,256,0.012422222230169507
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,256,256,0.02535999980237749
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,256,65536,0.046161777443355985
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,256,64,0.0028640000770489373
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,256,32,0.0029519999192820657
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,256,128,0.021270222134060327
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,256,128,0.011792889071835412
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,128,65536,0.036834667126337685
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,128,51200,0.029271999994913738
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,256,32,0.011736888852384357
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,128,16384,0.012757333616415659
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,256,3584,0.035191999541388616
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,128,16384,0.16410133573744032
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,128,12288,0.01092355532778634
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,128,51200,0.4953342013888889
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,128,65536,0.6310773425632054
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,128,10240,0.01032977799574534
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,128,12288,0.11940977308485244
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,128,12288,0.19295644760131836
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,128,51200,0.7735902468363444
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,128,8192,0.009297777381208207
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,128,10240,0.09638844596015082
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,128,65536,0.9840720494588217
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,128,7168,0.00869777798652649
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,128,10240,0.1619902186923557
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,128,6144,0.008329778081840938
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,128,8192,0.07714933156967163
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,128,8192,0.13231200642055935
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,128,5120,0.007824000385072496
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,128,7168,0.11803644233279759
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,256,64,0.011869333684444427
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,128,6144,0.05892355574501885
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,128,6144,0.1038622193866306
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,128,4096,0.007637333538797166
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,128,3584,0.007117333511511485
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,128,5120,0.04825777808825175
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,128,5120,0.08988710906770493
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,128,3072,0.006636444479227066
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,128,4096,0.04007644454638163
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,128,4096,0.07448799742592706
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,128,2560,0.00590844452381134
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,128,3584,0.03506133291456435
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,128,3584,0.06786577569113837
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,128,2048,0.00554666668176651
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,128,3072,0.059895998901791044
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,128,3072,0.03190933333502875
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,128,1536,0.004592000196377437
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,128,2560,0.05341066585646736
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,128,2560,0.028107557031843398
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,128,1024,0.004238222208287981
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,128,2048,0.04725333385997348
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,128,2048,0.025077333052953083
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,128,1536,0.04011022382312351
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,128,768,0.0038924444880750445
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,128,1024,0.017528888252046373
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,128,1024,0.034544888469907976
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,128,512,0.003499555504984326
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,128,768,0.03018488817744785
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,128,768,0.015110222829712762
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,128,256,0.003144888828198115
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,128,512,0.013813333378897773
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,128,512,0.02706844442420536
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,128,128,0.0028719999310043124
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,128,256,0.024346666203604803
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,128,256,0.012436444560686747
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,128,64,0.002858666703104973
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,128,128,0.011791999969217511
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,128,128,0.022319111559126113
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,128,7168,0.06814489099714491
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,128,32,0.00286666676402092
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,64,65536,0.033470223347345986
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,128,64,0.012040889097584618
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,64,51200,0.027746667464574177
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,128,32,0.011775111158688864
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,64,16384,0.012216889195972018
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,64,12288,0.010123555858929953
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,64,16384,0.16365688376956516
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,64,10240,0.009370666411187913
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,64,12288,0.11951911449432373
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,64,8192,0.008638222184446123
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,64,7168,0.00828888929552502
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1280,128,16384,0.26090312004089355
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,64,51200,0.49452887641059023
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,64,6144,0.007664889097213745
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,64,10240,0.09647288587358262
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,128,1536,0.020938666330443487
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,64,5120,0.008280889027648503
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,64,4096,0.007283555964628856
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,64,7168,0.06810755862130059
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,64,3584,0.007198221981525421
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,64,3072,0.006302222195598815
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,64,6144,0.0585742195447286
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,64,5120,0.04798310995101929
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,64,2560,0.00590133335855272
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,64,2048,0.005215999980767568
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,64,3584,0.03497688968976339
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,64,3072,0.03157155712445577
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,64,1536,0.00453244439429707
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,64,1024,0.0041964443193541635
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,64,2560,0.027950220637851294
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,64,768,0.0038559999730851916
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,64,2048,0.024724443753560383
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,64,512,0.00350222239891688
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,64,1536,0.020805334051450092
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,64,1024,0.017515555024147034
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,64,768,0.015255111787054272
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,64,128,0.0028373334142896864
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,64,512,0.013457777599493662
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,64,64,0.0028764444092909494
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,64,256,0.012113778127564324
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,64,32,0.0028968888024489083
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,64,128,0.012068444656001197
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,64,64,0.011745777395036487
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,32,65536,0.03187288840611776
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,64,32,0.011702222128709158
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,64,65536,0.6308159828186035
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,32,16384,0.009304000271691216
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,64,4096,0.03868088788456387
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,32,12288,0.01238844460911221
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,32,16384,0.16401067044999865
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,32,51200,0.49497069252861875
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,32,65536,0.62973419825236
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,32,10240,0.011086222198274402
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,32,8192,0.00998755544424057
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,32,7168,0.009371555513805812
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,32,12288,0.11865954928927952
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,32,10240,0.09552355607350667
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,64,256,0.0031591111587153543
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,32,8192,0.0768151084582011
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,32,6144,0.008671999805503422
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,32,5120,0.008288000192907121
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,32,4096,0.007585778004593319
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,32,7168,0.06815999746322632
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,32,3584,0.007616000043021307
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,32,3072,0.006284444282452266
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,32,6144,0.05861333343717787
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,32,5120,0.04876177840762668
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,32,2560,0.005974222388532426
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,32,4096,0.04016444418165419
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,32,2048,0.005221333354711533
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,32,3584,0.03495111068089803
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,32,1536,0.004519999855094486
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,32,3072,0.031397332747777305
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,32,1024,0.0038515557017591265
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,32,51200,0.026183111800087824
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,32,768,0.0035377778112888336
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,32,2560,0.02794933319091797
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,32,512,0.0031617778456873367
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,32,1536,0.020682666036817763
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,32,1024,0.01717066599263085
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,32,768,0.015160888433456421
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,32,128,0.0028311111446883944
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,32,512,0.01349955548842748
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,32,64,0.0024986666523747975
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,64,8192,0.07721689012315539
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,32,32,0.002516444358560774
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,32,128,0.011689778003427716
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,32,64,0.011712888876597086
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,32,32,0.01145511120557785
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,32,2048,0.024811555941899616
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1280,32,256,0.0028684443483750024
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1280,32,256,0.012396444049146442
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,65536,16384,1.2416808870103624
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,65536,12288,0.9168586730957031
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,65536,16384,1.6008408864339192
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,65536,10240,0.7495955361260308
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,65536,8192,0.6448293262057835
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,65536,12288,1.1319315168592665
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,65536,10240,0.9482569164699979
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,65536,7168,0.5794151094224718
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,65536,8192,0.7547333505418566
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,65536,6144,0.42815200487772626
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,65536,7168,0.6688684357537164
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,65536,5120,0.4317857689327664
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,65536,6144,0.5572266578674316
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,65536,4096,0.3317280080583361
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,65536,5120,0.4670880105760362
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,65536,3072,0.2507750988006592
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,65536,3584,0.3236328760782878
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,65536,2560,0.20111466778649223
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,65536,3072,0.28041421042548287
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,65536,2560,0.24028176731533477
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,65536,51200,4.001223246256511
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,65536,2048,0.16292088561587864
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,65536,1536,0.13239199585384792
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,65536,1024,0.08908710877100627
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,65536,2048,0.1970062255859375
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,65536,768,0.07614044348398845
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,65536,1024,0.11913243929545085
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,65536,768,0.09717333316802979
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,65536,512,0.06174311372968885
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,65536,256,0.04203822215398153
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,65536,3584,0.29584889941745335
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,65536,128,0.033407999409569636
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,65536,1536,0.16295822461446127
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,65536,512,0.08454222149319118
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,65536,32,0.030258665482203167
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,65536,256,0.07684710952970716
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,65536,4096,0.3715928925408258
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,65536,64,0.028134223487642076
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,65536,64,0.07230044735802545
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,65536,32,0.07187733385297987
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,65536,51200,5.442871941460504
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,51200,16384,0.9473288853963217
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,65536,128,0.07209955321417914
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,51200,16384,1.2808604770236545
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,51200,12288,0.7318657769097222
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,51200,10240,0.5590853161282009
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,51200,8192,0.5064489046732584
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,51200,12288,0.9178222020467123
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,51200,10240,0.7488808631896973
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,51200,7168,0.43195377455817324
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,51200,8192,0.617103099822998
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,51200,6144,0.34252532323201496
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,51200,7168,0.5104364289177789
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,51200,5120,0.2878204451666938
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,51200,51200,3.1048240661621094
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,51200,4096,0.22671111424763998
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,51200,6144,0.4616053369310167
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,51200,5120,0.40821509891086155
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,51200,3584,0.24230488141377768
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,51200,4096,0.310811546113756
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,51200,3072,0.19564621978335908
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,51200,3584,0.2593617704179552
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,51200,2560,0.16721955935160318
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,51200,3072,0.23330754703945586
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,51200,2048,0.1326106654273139
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,51200,2560,0.20171199904547799
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,51200,1024,0.07124444511201647
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,51200,2048,0.15894222259521484
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,51200,65536,4.039280785454644
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,51200,768,0.06071199973424276
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,51200,1536,0.12861600187089708
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,51200,1024,0.09741066561804877
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,51200,1536,0.1002417802810669
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,51200,128,0.02715555495686001
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,51200,256,0.034267554680506386
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,51200,64,0.02276533345381419
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,51200,51200,4.176998138427734
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,51200,256,0.06332711378733318
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,51200,512,0.05673333009084066
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,51200,128,0.05976711379157173
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,51200,512,0.0698417756292555
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,51200,64,0.05919555823008219
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,51200,32,0.05912533071306017
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,16384,16384,0.31293511390686035
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,51200,768,0.07932266924116346
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,51200,65536,5.572977701822917
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,16384,16384,0.4611208703782823
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,16384,51200,1.0611866845024955
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,51200,32,0.02327199942535824
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,16384,12288,0.2356568972269694
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,16384,10240,0.2148817777633667
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,16384,65536,1.5092204411824544
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,16384,8192,0.19525067011515299
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,16384,12288,0.3476817872789171
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,16384,10240,0.30394577980041504
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,16384,7168,0.1551884412765503
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,16384,6144,0.15436444017622206
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,16384,8192,0.2237786716885037
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,16384,5120,0.11761866675482856
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,16384,51200,1.5582159890068903
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,16384,4096,0.10069777568181355
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,16384,6144,0.17421955532497832
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,16384,7168,0.219995551639133
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,16384,5120,0.16099466217888728
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,16384,3072,0.07872266901863946
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,16384,2560,0.061390221118927
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,16384,3584,0.10617599884668986
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,16384,65536,1.9378337860107422
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,16384,2048,0.04976000057326423
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,16384,1536,0.04068266683154636
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,16384,3072,0.09552622503704494
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,16384,1024,0.027287110686302185
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,16384,2560,0.09836266438166301
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,16384,768,0.021583999196688335
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,16384,2048,0.06788977649476793
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,16384,512,0.016861332787407767
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,16384,256,0.013332444760534497
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,16384,1024,0.043396443128585815
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,16384,768,0.03674133287535773
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,16384,128,0.010703110860453712
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,16384,512,0.029878222280078467
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,16384,64,0.009402666654851701
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,16384,32,0.009674666656388177
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,16384,128,0.026731555660565693
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,16384,64,0.02563200063175625
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,16384,32,0.025757332642873127
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,16384,3584,0.07898400227228801
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,16384,4096,0.11925066841973199
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,12288,16384,0.21595022413465711
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,12288,51200,0.7890542348225912
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,16384,1536,0.055973331133524575
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,12288,65536,0.9555617438422309
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,12288,12288,0.21730132897694907
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,16384,256,0.026738666825824316
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,12288,12288,0.2728933228386773
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,12288,16384,0.36851734585232204
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,12288,8192,0.11072711149851482
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,12288,7168,0.09685689210891724
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,12288,10240,0.29086844126383465
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,12288,6144,0.08400799830754598
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,12288,8192,0.18347644805908203
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,12288,7168,0.16236178080240884
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,12288,65536,1.569917360941569
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,12288,5120,0.0829662217034234
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,12288,51200,1.236512925889757
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,12288,4096,0.07052266597747803
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,12288,3584,0.06242577897177803
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,12288,6144,0.15795021586947972
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,12288,3072,0.05255822340647379
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,12288,5120,0.1207653284072876
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,12288,4096,0.09905066755082871
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,12288,2560,0.045400000280804105
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,12288,3584,0.08784977595011394
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,12288,2048,0.036686221758524575
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,12288,1024,0.021033777130974665
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,12288,3072,0.07795911365085177
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,12288,2560,0.06881155570348103
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,12288,768,0.017850667238235474
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,12288,2048,0.056652446587880455
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,12288,512,0.013799111048380533
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,12288,256,0.010072888599501716
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,12288,1536,0.046055999067094594
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,12288,128,0.008562666674455007
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,12288,1024,0.03530755639076233
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,12288,64,0.007583111524581909
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,12288,512,0.02568799919552273
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,12288,32,0.007409777906205919
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,12288,256,0.02296977738539378
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,12288,10240,0.17082756095462373
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,12288,64,0.02212711175282796
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,12288,128,0.0222746663623386
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,12288,32,0.02198933396074507
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,10240,16384,0.20946044392055937
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,10240,16384,0.3285173310173882
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,10240,12288,0.15915555424160427
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,10240,51200,0.6103537877400717
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,10240,65536,0.7705938021341959
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,10240,10240,0.14913511276245117
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,12288,1536,0.03064889046880934
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,10240,12288,0.2406888802846273
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,10240,8192,0.1395662228266398
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,10240,7168,0.11262310875786676
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,10240,10240,0.21661067008972168
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,12288,768,0.030023111237419978
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,10240,7168,0.1440204381942749
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,10240,5120,0.08466400040520562
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,10240,6144,0.1251351171069675
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,10240,4096,0.06479733520083956
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,10240,65536,1.3844667010837133
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,10240,3584,0.05888622336917453
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,10240,5120,0.10660622517267863
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,10240,3072,0.049499554766549
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,10240,4096,0.09206577804353501
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,10240,2560,0.03913155529234145
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,10240,3584,0.0798835555712382
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,10240,2048,0.03433333171738519
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,10240,1536,0.02628444466325972
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,10240,3072,0.0703022215101454
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,10240,1024,0.019302222463819716
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,10240,768,0.015615999698638916
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,10240,2048,0.0502106679810418
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,10240,1536,0.04203200009134081
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,10240,512,0.012318222059143914
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,10240,1024,0.03198044498761495
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,10240,256,0.008665777742862701
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,10240,768,0.027795556518766616
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,10240,128,0.007429333196745978
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,10240,512,0.023601777023739282
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,10240,64,0.006643555644485686
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,10240,256,0.02127733329931895
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,10240,32,0.006608888920810487
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,10240,128,0.020639111598332722
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,10240,64,0.02036355601416694
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,10240,8192,0.16542932722303602
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,10240,51200,1.0879440307617188
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,8192,65536,0.657518227895101
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,8192,51200,0.5074453353881836
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,10240,2560,0.06106133593453301
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,8192,16384,0.17496977912055123
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,8192,12288,0.13886222574445936
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,8192,16384,0.29873866505093044
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,8192,10240,0.10587910811106364
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,8192,8192,0.08289777570300631
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,8192,65536,1.19814576043023
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,8192,12288,0.24543823136223686
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,8192,51200,0.9411057366265191
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,10240,6144,0.10433510939280193
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,8192,7168,0.07767733600404528
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,8192,6144,0.07070133421156141
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,8192,10240,0.1783884498808119
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,8192,5120,0.05415822068850199
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,8192,4096,0.04597244328922696
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,8192,8192,0.1413724422454834
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,8192,7168,0.13015645080142552
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,8192,3584,0.041794667641321816
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,8192,3072,0.038035555018319026
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,8192,5120,0.09471199909845988
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,8192,2560,0.03302755620744493
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,8192,4096,0.07643466525607638
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,8192,2048,0.02812266680929396
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,8192,6144,0.11006400320265029
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,8192,1536,0.023220444718996685
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,8192,3072,0.061231997278001576
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,8192,1024,0.017893332574102614
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,8192,2560,0.05361955695682102
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,8192,768,0.015547555353906421
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,8192,2048,0.043920000394185386
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,8192,512,0.012367111113336353
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,8192,1536,0.03706222110324436
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,8192,1024,0.028730667299694482
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,8192,128,0.0074826669361856245
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,8192,768,0.025088000628683303
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,8192,512,0.021334222621387903
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,8192,64,0.00657066661450598
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,8192,256,0.01947733263174693
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,8192,32,0.00683111117945777
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,8192,128,0.01867288847764333
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,8192,32,0.018557333283954196
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,8192,64,0.018550222118695576
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,7168,16384,0.1439911127090454
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,10240,32,0.020317332612143624
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,7168,65536,0.5032551023695204
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,7168,12288,0.1112720039155748
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,7168,51200,0.40398311614990234
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,7168,10240,0.09810133112801446
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,7168,16384,0.2660035557217068
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,8192,3584,0.07004000080956353
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,7168,8192,0.07925955454508464
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,7168,7168,0.0649626652399699
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,7168,10240,0.16250756051805285
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,7168,12288,0.20499022801717123
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,7168,6144,0.0569795568784078
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,8192,256,0.008624888956546783
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,7168,5120,0.04650577902793884
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,7168,7168,0.11717066499922012
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,7168,4096,0.03783644570244683
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,7168,3584,0.03404266635576884
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,7168,6144,0.10560977458953857
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,7168,3072,0.028839111328125
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,7168,2560,0.024753777517212763
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,7168,3584,0.06257777743869357
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,7168,3072,0.05936621957355075
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,7168,2048,0.021225778592957392
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,7168,1536,0.016916443904240925
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,7168,2560,0.05036266644795736
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,7168,1024,0.012984889249006907
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,7168,2048,0.04200889004601372
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,7168,1536,0.03466577662361993
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,7168,768,0.010770666930410596
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,7168,512,0.008281778130266402
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,7168,1024,0.027316444449954565
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,7168,256,0.0069217777086628815
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,7168,768,0.023345778385798138
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,7168,512,0.02027466727627648
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,7168,128,0.006069333189063602
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,7168,64,0.005613333235184352
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,7168,256,0.018603555030292936
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,7168,32,0.005605333381228977
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,7168,128,0.017870222528775532
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,7168,64,0.0181404451529185
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,7168,8192,0.13175288836161295
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,7168,32,0.017864000466134813
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,7168,51200,0.867378658718533
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,7168,65536,1.1118649376763237
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,7168,5120,0.08831644720501369
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,7168,4096,0.07527377870347765
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,6144,65536,0.46050935321384007
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,6144,51200,0.3779306676652696
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,6144,12288,0.08339733547634548
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,6144,10240,0.09268089135487874
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,6144,16384,0.24645598729451498
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,6144,8192,0.07639377646976046
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,6144,12288,0.21234667301177979
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,6144,10240,0.15040444003211126
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,6144,7168,0.06473600202136569
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,6144,6144,0.048820445934931435
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,6144,8192,0.12210222085316975
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,6144,5120,0.040998223755094744
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,6144,51200,0.794382201300727
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,6144,7168,0.11843466758728027
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,6144,4096,0.03495644529660543
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,6144,3584,0.03274844421280755
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,6144,6144,0.09991733233133952
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,6144,5120,0.08261777957280476
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,6144,3072,0.02880177895228068
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,6144,4096,0.06772266493903266
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,6144,3584,0.058964444531334766
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,6144,2048,0.02017244365480211
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,6144,3072,0.0534728897942437
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,6144,2560,0.04849777619043986
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,6144,1024,0.013028444515334235
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,6144,2048,0.039120889372295804
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,6144,768,0.010776888993051318
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,6144,1536,0.03308444552951389
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,6144,512,0.008159110943476358
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,6144,1024,0.025739555557568867
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,6144,16384,0.11481689082251655
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,6144,256,0.006623111251327727
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,6144,128,0.005893333504597346
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,6144,768,0.022288888692855835
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,6144,64,0.005210666606823604
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,6144,512,0.019256000717480976
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,6144,256,0.01756088932355245
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,6144,128,0.01737955543729994
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,6144,64,0.016943110360039603
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,6144,32,0.016528889536857605
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,6144,65536,1.019595570034451
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,5120,65536,0.418870210647583
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,5120,51200,0.3362773259480794
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,6144,2560,0.024255999260478552
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,5120,16384,0.10803021987279256
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,5120,12288,0.08079910940594144
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,6144,1536,0.016421332955360413
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,5120,10240,0.07379466957516141
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,5120,16384,0.22529599401685926
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,5120,8192,0.06326133012771606
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,5120,12288,0.16935200161404082
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,5120,10240,0.13897244135538736
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,5120,7168,0.05433244506518046
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,5120,65536,0.9266835318671333
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,5120,6144,0.0448000000582801
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,5120,8192,0.11396977636549209
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,5120,5120,0.03999377621544732
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,5120,7168,0.10423733128441705
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,6144,32,0.0052728888889153796
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,5120,4096,0.031042665243148804
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,5120,3584,0.02942488922013177
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,5120,6144,0.08957955572340225
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,5120,3072,0.026198221577538386
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,5120,2560,0.021362667282422382
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,5120,5120,0.0760986672507392
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,5120,2048,0.018194667167133756
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,5120,3584,0.05436444282531738
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,5120,1536,0.01513777838812934
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,5120,3072,0.04878488845295376
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,5120,1024,0.011178666518794166
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,5120,2560,0.043213334348466664
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,5120,768,0.009656888743241629
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,5120,2048,0.036361777120166354
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,5120,1536,0.03065955638885498
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,5120,1024,0.02329866588115692
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,5120,256,0.0064088888466358185
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,5120,768,0.020960888928837244
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,5120,128,0.005559111220969095
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,5120,512,0.01826133330663045
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,5120,64,0.004873777843183941
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,5120,32,0.005220444252093633
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,5120,128,0.016377778516875375
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,5120,64,0.016166221764352586
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,5120,32,0.01585422290696038
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,4096,65536,0.34984178013271755
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,4096,51200,0.28145599365234375
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,5120,51200,0.7271511289808484
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,4096,16384,0.09544799725214641
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,4096,12288,0.0735057791074117
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,4096,16384,0.20509866873423258
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,4096,10240,0.05895911322699653
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,5120,512,0.00794488853878445
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,4096,65536,0.8369848993089465
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,4096,12288,0.15596266587575278
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,4096,7168,0.04452266626887851
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,4096,51200,0.6626159879896376
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,4096,6144,0.038485334979163274
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,4096,8192,0.10372000270419651
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,4096,10240,0.12665955225626627
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,4096,7168,0.09609511163499619
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,4096,5120,0.032348444064458214
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,4096,4096,0.027496889233589172
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,4096,3584,0.025120000044504803
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,4096,6144,0.08118755287594266
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,4096,3072,0.021317332983016968
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,4096,5120,0.06906400124231975
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,4096,4096,0.05619555711746216
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,4096,2560,0.018446221947669983
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,4096,3584,0.05079822076691521
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,4096,2048,0.015820443630218506
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,4096,3072,0.0444160004456838
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,4096,1536,0.013080000049538083
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,4096,2560,0.03975466556019253
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,4096,1024,0.010035555395815108
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,4096,768,0.008620444271299574
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,4096,2048,0.03314222229851617
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,4096,1536,0.02819377846188015
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,4096,512,0.007252444823582967
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,4096,1024,0.021653332644038733
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,4096,256,0.005608888963858287
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,5120,4096,0.06226666768391927
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,4096,128,0.004925333377387789
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,4096,768,0.019840889506869845
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,4096,64,0.004879111217127906
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,4096,512,0.01723377737734053
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,4096,32,0.0046880000995265115
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,4096,256,0.015784000356992085
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,4096,128,0.01518311103185018
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,4096,64,0.015104888214005364
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,4096,8192,0.048248890373441905
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,4096,32,0.014899555179807874
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,3584,16384,0.07990755637486775
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,3584,65536,0.2998044490814209
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,3584,51200,0.20825866858164468
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,5120,256,0.01682222220632765
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,3584,12288,0.05626222160127428
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,3584,10240,0.04708533485730489
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,3584,8192,0.03889688849449158
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,3584,16384,0.19426400131649443
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,3584,7168,0.03436000148455302
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,3584,6144,0.029817776547537908
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,3584,10240,0.12024533748626709
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,3584,5120,0.024857777688238356
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,3584,8192,0.0991742213567098
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,3584,7168,0.08814577923880683
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,3584,4096,0.020806221498383414
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,3584,51200,0.6174577607048882
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,3584,6144,0.0770675539970398
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,3584,65536,0.7895750999450684
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,3584,3072,0.017078222499953378
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,3584,5120,0.0651057759920756
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,3584,2560,0.015066666735543145
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,3584,4096,0.05340800020429823
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,3584,2048,0.012874667015340594
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,3584,3584,0.04777422216203478
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,3584,1536,0.010643555886215635
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,3584,1024,0.00833777752187517
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,3584,3072,0.04235644472969902
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,3584,2560,0.0379671123292711
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,3584,2048,0.03189599845144484
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,3584,768,0.006973333656787872
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,3584,512,0.006222222414281633
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,3584,256,0.005195555587609609
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,3584,1024,0.020960888928837244
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,3584,768,0.018921777606010437
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,3584,512,0.016759110821617972
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,3584,64,0.0038924444880750445
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,3584,256,0.015462223026487561
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,3584,128,0.014881778094503613
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,3584,64,0.014840889308187695
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,3584,32,0.014446222119861178
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,3072,65536,0.23753955629136828
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,3584,3584,0.01891999940077464
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,3072,51200,0.17942310704125297
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,3072,16384,0.07088889016045465
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,3584,1536,0.026455110973782007
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,3072,65536,0.7472782135009766
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,3072,16384,0.19629244009653726
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,3072,12288,0.05214488837454054
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,3072,10240,0.04177244504292806
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,3072,8192,0.03386666708522373
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,3072,51200,0.5865857866075304
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,3584,32,0.0042444442709287005
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,3072,12288,0.13496800263722739
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,3072,10240,0.11361422803666855
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,3072,6144,0.025560888979170058
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,3072,5120,0.023935111032591924
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,3072,8192,0.09767022397783066
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,3072,7168,0.08315555254618327
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,3072,4096,0.01940088967482249
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,3072,6144,0.07271199756198458
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,3072,3584,0.01771377854877048
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,3584,12288,0.14978133307562932
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,3072,3072,0.015936889582210116
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,3072,2560,0.013656888571050433
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,3072,4096,0.050373332368003
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,3072,3584,0.04499199986457825
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,3072,3072,0.040287110540601946
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,3072,2048,0.011683555940786997
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,3072,2560,0.03586311141649882
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,3072,1536,0.009655999640623728
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,3072,1024,0.0075902218619982404
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,3072,2048,0.029508444997999404
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,3072,768,0.00657066661450598
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,3072,1536,0.025776000486479864
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,3072,512,0.005550222264395819
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,3072,1024,0.01995733380317688
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,3072,256,0.004824000100294749
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,3072,128,0.0042462220622433555
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,3072,768,0.018180444836616516
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,3072,512,0.016183111402723525
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,3072,64,0.003899555653333664
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,3072,256,0.015126221709781222
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,3072,32,0.0039013334446483185
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,3072,128,0.01444533301724328
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,3072,64,0.014477334088749357
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,3072,32,0.014146667387750415
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,3072,7168,0.030279109875361126
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,2560,65536,0.2333448992835151
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,2560,16384,0.05453955464892917
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,2560,51200,0.16939732763502333
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,2560,12288,0.04377333323160807
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,2560,10240,0.03853866789076064
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,3072,5120,0.061370664172702365
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,2560,16384,0.17440622382693818
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,2560,8192,0.03158222304450141
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,2560,12288,0.12745066483815512
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,2560,7168,0.027954667806625366
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,2560,6144,0.024712888730896845
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,2560,10240,0.1076986657248603
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,2560,65536,0.7029129134284126
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,2560,8192,0.0879146655400594
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,2560,5120,0.021380444367726643
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,2560,7168,0.0784097777472602
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,2560,4096,0.018265777164035372
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,2560,3584,0.016580444243219163
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,2560,6144,0.06848444541295369
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,2560,3072,0.014984889162911309
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,2560,5120,0.057258665561676025
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,2560,2560,0.013089777694808112
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,2560,2048,0.011075555450386472
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,2560,3584,0.042520887321896024
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,2560,4096,0.04742666747834948
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,2560,1536,0.009658666948477427
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,2560,3072,0.0381022228135003
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,2560,1024,0.007618666523032718
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,3584,128,0.004558222161398994
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,2560,2560,0.033258666594823204
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,2560,768,0.006962666908899943
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,2560,2048,0.02832177612516615
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,2560,1536,0.023934221929974023
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,2560,512,0.005605333381228977
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,2560,256,0.004882666799757215
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,2560,128,0.004187555362780889
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,2560,1024,0.019259555472267997
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,2560,64,0.0038862224254343244
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,2560,768,0.018065777089860704
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,2560,512,0.015501333607567681
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,2560,256,0.014543111125628153
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,2560,128,0.014144000079896716
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,2560,64,0.014106666048367819
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,2560,32,0.014138667119873894
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,2048,65536,0.1981519990497165
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,2048,51200,0.16455554962158203
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,2048,16384,0.05271644393603007
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,2048,12288,0.04120799899101257
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,2048,10240,0.0347324444188012
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,2048,16384,0.16621689001719156
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,2048,12288,0.11961421701643203
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,2048,8192,0.028190222051408555
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,2560,51200,0.5508249070909288
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,2048,7168,0.024520888924598694
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,2048,10240,0.10071200132369995
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,2048,51200,0.5139813423156738
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,2048,6144,0.021828444467650518
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,2048,5120,0.020834666159417894
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,2048,65536,0.6586853133307563
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,2048,4096,0.016297777493794758
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,2048,7168,0.0732311142815484
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,2048,3584,0.01475822263293796
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,2048,3072,0.01311377767059538
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,2048,5120,0.05437155564626058
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,2048,2560,0.011710222396585675
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,2048,4096,0.04510577850871616
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,2048,3584,0.040213333235846624
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,2048,2048,0.010000000397364298
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,2048,1536,0.008656889200210571
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,2048,2560,0.031154665682050917
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,2048,1024,0.0069724445541699724
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,2048,2048,0.026549332671695288
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,2048,768,0.005904888941182031
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,2048,1536,0.022685334086418152
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,2048,512,0.005223111146026188
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,2048,1024,0.018241778016090393
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,2048,256,0.0042364444169733255
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,2048,768,0.01699822147687276
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,2048,512,0.015115555789735583
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,2048,128,0.0038480001191298165
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,2048,256,0.014045332868893942
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,2048,64,0.003573333223660787
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,2048,128,0.013560888667901358
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,2048,32,0.0035822221802340615
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,2048,64,0.013431111143694984
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,2048,32,0.013279111021094851
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,2048,8192,0.0825857785012987
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,1536,65536,0.17572177780999076
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,2048,6144,0.06372088856167264
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,1536,51200,0.13441777229309082
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,1536,16384,0.04446577694680956
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,1536,12288,0.03356800145573086
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,2048,3072,0.03598577777544657
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,1536,10240,0.028912888632880315
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,2560,32,0.0038862224254343244
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,1536,8192,0.02314222190115187
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,1536,12288,0.11208000448015
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,1536,7168,0.020592000749376085
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,1536,51200,0.47805510626898867
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,1536,10240,0.09394222497940063
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,1536,65536,0.6112560166252984
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,1536,6144,0.01889155473974016
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,1536,5120,0.016237333416938782
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,1536,4096,0.014137778017255994
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,1536,8192,0.07694400019115873
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,1536,3584,0.012462221913867526
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,1536,7168,0.06832266516155668
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,1536,3072,0.011579555769761404
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,1536,6144,0.05886755386988322
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,1536,2560,0.009642666412724389
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,1536,4096,0.040864888164732195
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,1536,2048,0.008341333104504479
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,1536,3584,0.03765155540572272
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,1536,1536,0.007261333366235097
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,1536,1024,0.0059573331640826324
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,1536,2560,0.029297779003779095
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,1536,2048,0.025290666355027094
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,1536,768,0.005559111220969095
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,1536,512,0.004825777891609403
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,1536,1536,0.021319111188252766
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,1536,1024,0.017183999220530193
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,1536,256,0.004184000194072723
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,1536,128,0.0038559999730851916
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,1536,768,0.016143111719025504
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,1536,64,0.0034924443397257063
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,1536,512,0.014775110615624322
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,1536,32,0.003571555432346132
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,1536,256,0.013425778183672162
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,1536,128,0.01312711089849472
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,1536,64,0.012739555703269111
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,1536,32,0.013082666529549493
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,1024,65536,0.13748355706532797
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,1024,16384,0.040349334478378296
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,1024,51200,0.10985155238045587
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,1024,12288,0.03358844584888882
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,1024,16384,0.14335021707746717
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,1024,12288,0.10351377725601196
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,1024,10240,0.0270453327231937
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,1024,65536,0.5642293294270834
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,1024,8192,0.02123022245036231
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,1536,5120,0.05062399970160591
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,1024,7168,0.018505778577592637
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,1024,6144,0.01640888883007897
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,1024,10240,0.08745955758624607
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,1536,3072,0.03352800011634827
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,1024,5120,0.014816888504558139
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,1024,4096,0.012423111332787408
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,1024,7168,0.06294666396247016
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,1024,6144,0.05428533421622383
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,1024,3584,0.011370666325092316
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,1024,3072,0.010010666317409938
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,1024,5120,0.04600355691379971
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,1024,2560,0.008946666287051307
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,1024,4096,0.03809422254562378
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,1024,2048,0.007992000215583378
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,1024,3072,0.030208001534144085
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,1024,1536,0.006903999795516332
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,1024,2560,0.027457776996824477
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,1024,1024,0.005209777918126848
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,1024,2048,0.02366133365366194
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,1024,768,0.004917333523432414
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,1024,1536,0.020428443948427837
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,1536,16384,0.15299822224511042
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,1024,512,0.0045422220395671
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,1024,1024,0.016524444023768108
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,1024,256,0.0038577777643998465
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,1024,768,0.015452444553375244
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,1024,512,0.014146667387750415
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,1024,256,0.0131217779384719
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,1024,64,0.003181333343187968
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,1024,128,0.012727999852763282
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,1024,32,0.0033573332346147964
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,1024,51200,0.44253333409627277
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,1024,64,0.012618666721714867
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,768,65536,0.09692977534400092
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,1024,32,0.012072000238630505
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,768,51200,0.0776053335931566
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,1024,8192,0.07138578097025554
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,768,16384,0.14072355959150526
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,1024,3584,0.03489244315359328
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,768,51200,0.4390008979373508
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,768,10240,0.024439111351966858
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,768,65536,0.5581128862169054
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,768,8192,0.018908444378111098
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,768,7168,0.018100443813535903
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,768,12288,0.10303288698196411
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,768,6144,0.01482488877243466
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,768,8192,0.07040977478027344
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,768,5120,0.01311822235584259
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,768,7168,0.06179110871420967
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,1024,128,0.0034417777011791864
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,768,4096,0.010100444157918295
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,768,6144,0.05342222253481547
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,768,3584,0.009374221993817223
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,768,3072,0.00833777752187517
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,768,5120,0.04496711161401537
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,768,4096,0.03715288970205519
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,768,2560,0.007807999849319458
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,768,2048,0.006679111056857639
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,768,3072,0.030082666211658057
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,768,1536,0.005948444621430502
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,768,2560,0.027427555786238775
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,768,16384,0.030672887961069744
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,768,2048,0.023382221659024555
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,768,768,0.004590222405062782
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,768,1536,0.020248000820477802
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,768,512,0.0038951109680864546
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,768,1024,0.01647733317481147
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,768,768,0.015488000379668342
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,768,512,0.013791999883121915
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,768,12288,0.029537777105967205
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,768,128,0.0031866667171319327
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,768,256,0.013087111214796701
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,768,64,0.0031582222630580268
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,768,32,0.0031591111587153543
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,768,128,0.012726222475369772
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,768,64,0.012440000143316058
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,768,10240,0.08687111404207017
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,768,32,0.012088889049159156
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,512,65536,0.07083821958965726
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,512,16384,0.022441777918073866
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,512,51200,0.057242665025922984
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,512,12288,0.019409777389632333
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,512,16384,0.13132088714175755
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,768,3584,0.03388533327314589
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,512,10240,0.01640266676743825
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,512,12288,0.09544177850087483
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,512,8192,0.01366666704416275
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,512,51200,0.40731022093031144
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,512,7168,0.01240711079703437
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,512,65536,0.5184355311923557
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,512,6144,0.01130222198035982
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,768,1024,0.00498577786816491
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,512,5120,0.010259555445777046
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,512,10240,0.07967199881871541
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,512,4096,0.008369777765538957
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,512,3584,0.007923555870850882
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,512,7168,0.05681066380606758
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,512,3072,0.0070222218831380205
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,512,5120,0.0424231125248803
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,768,256,0.0035537779331207275
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,512,2560,0.006598222172922558
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,512,4096,0.03463110989994473
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,512,2048,0.005893333504597346
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,512,3584,0.03159111075931125
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,512,1536,0.005224888937340842
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,512,3072,0.028151111470328435
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,512,1024,0.0045422220395671
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,512,768,0.003900444342030419
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,512,2560,0.025711110896534387
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,512,2048,0.022294221652878657
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,512,512,0.0035093331502543557
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,512,1536,0.019254222512245178
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,512,256,0.0034835553831524322
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,512,1024,0.01550044450494978
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,512,768,0.01479111115137736
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,512,512,0.013404444687896304
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,512,64,0.0028284444577164124
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,512,256,0.012418666647540199
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,512,32,0.003142222141226133
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,512,128,0.01203644441233741
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,256,65536,0.04184088773197598
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,512,64,0.011752000285519494
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,512,32,0.012048000262843238
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,256,16384,0.0151555554734336
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,256,16384,0.13057955106099448
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,256,12288,0.013453333742088742
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,512,8192,0.06502844227684869
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,256,51200,0.40601332982381183
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,256,65536,0.5164835717942979
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,256,10240,0.01236355553070704
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,256,8192,0.011328889264000786
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,512,6144,0.04880977670351664
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,256,7168,0.011764444410800934
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,256,6144,0.010374222364690568
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,256,12288,0.09445155329174465
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,256,10240,0.07885333564546373
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,256,5120,0.009090666969617208
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,256,8192,0.0642133355140686
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,256,7168,0.05629777908325195
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,256,4096,0.007963555554548899
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,256,6144,0.04786755641301473
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,256,3584,0.007305777735180325
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,512,128,0.0031511110977994073
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,256,5120,0.04114133450720046
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,256,3072,0.006593777901596493
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,256,2560,0.005936000082227919
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,256,2048,0.0052284445199701525
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,256,3584,0.03109333250257704
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,256,3072,0.027757333384619817
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,256,1536,0.004734222259786394
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,256,2560,0.025376889440748427
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,256,51200,0.03366311060057746
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,256,2048,0.022016000416543748
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,256,768,0.003843555433882607
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,256,512,0.0034888887570963967
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,256,1024,0.01552088889810774
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,256,256,0.0031591111587153543
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,256,768,0.014854222536087036
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,256,512,0.01314133322901196
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,256,128,0.0031848889258172777
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,256,64,0.0028293333533737394
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,256,256,0.012158222496509552
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,256,32,0.0028640000770489373
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,256,128,0.011725333001878528
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,256,64,0.012093333734406365
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,128,65536,0.034380445877710976
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,128,51200,0.027239110734727647
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,256,32,0.011607111328177981
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,128,16384,0.01237155579858356
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,128,16384,0.13048711087968615
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,256,4096,0.033569776349597506
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,128,12288,0.010609777437316047
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,128,10240,0.00997866690158844
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,128,51200,0.4056391186184353
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,128,8192,0.009031111167536842
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,256,1024,0.0038888889054457345
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,128,12288,0.09423110882441203
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,128,7168,0.008676444490750631
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,128,10240,0.07869599925147162
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,256,1536,0.018928888771269057
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,128,6144,0.007987555530336168
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,128,8192,0.06451911396450467
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,128,5120,0.008665777742862701
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,128,4096,0.008119111259778341
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,128,7168,0.05580088827345106
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,128,3584,0.007479999628331926
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,128,6144,0.047897779279285006
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,128,5120,0.04055555661519369
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,128,3072,0.006593777901596493
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,128,4096,0.03327466713057624
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,128,2560,0.005904888941182031
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,128,2048,0.00555377784702513
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,128,3584,0.03115288747681512
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,128,1536,0.004648888690604104
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,128,3072,0.02776088813940684
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,128,1024,0.00388355553150177
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,128,768,0.0038382220599386427
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,128,1536,0.019172444939613342
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,128,1024,0.01551999979548984
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,128,512,0.003506666670242945
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,128,768,0.014719999498791166
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,128,256,0.003170666595300039
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,128,128,0.0028000000036425064
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,128,512,0.013131555583741931
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,128,256,0.012092444631788464
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,128,64,0.002806222273243798
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,128,128,0.012063110868136087
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,128,65536,0.5156319936116537
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,64,65536,0.03230133321550157
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,128,64,0.011717333561844297
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,64,51200,0.024775111012988623
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,64,16384,0.011868444581826528
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,64,16384,0.13022755251990423
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,64,12288,0.010334221853150262
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,64,51200,0.4048079914516873
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,64,10240,0.009374221993817223
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,64,65536,0.5155102411905924
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,64,8192,0.008649778034951951
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,128,2560,0.025438222620222304
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,128,2048,0.02181422213713328
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,64,12288,0.0933342244890001
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,64,7168,0.008287111090289222
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,64,6144,0.007608888877762689
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,64,10240,0.07830222447713216
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,64,5120,0.008963555925422246
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,64,8192,0.06379377841949463
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,64,4096,0.007666666474607255
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,64,7168,0.055573330985175244
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,64,3584,0.006960888703664144
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,64,3072,0.006309333360857434
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,64,5120,0.03977333174811469
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,64,2560,0.005865777946180767
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,64,4096,0.03330577744377984
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,128,32,0.0028400001012616684
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,64,2048,0.0052391112678580815
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,64,3072,0.027760000692473516
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,64,1536,0.004559999952713649
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,64,2560,0.025021332833502028
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,64,1024,0.003907555507289039
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,128,32,0.011736888852384357
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,64,2048,0.021887110339270696
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,64,768,0.003859555555714501
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,64,1536,0.01891999940077464
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,64,512,0.0033982222278912864
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,64,256,0.0028942223224374983
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,64,1024,0.015458666616015963
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,64,768,0.014550222290886773
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,64,128,0.0028248888750871024
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,64,512,0.013062222136391534
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,64,32,0.0028906667398081887
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,64,256,0.01240711079703437
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,64,128,0.011735999749766456
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,32,65536,0.027462222509913977
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,64,64,0.011714666253990598
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,32,51200,0.02051111062367757
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,64,32,0.011394666300879585
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,32,16384,0.013861333330472311
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,32,12288,0.011704888608720569
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,32,16384,0.1301342248916626
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,32,10240,0.011407111254003314
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,32,12288,0.09360622035132514
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,64,6144,0.04823644293679131
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,32,8192,0.009717333647939894
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,32,51200,0.40513867802090114
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,32,7168,0.012431999875439538
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,32,65536,0.5154666900634766
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,32,6144,0.011024889018800525
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,32,5120,0.009711110757456886
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,64,3584,0.03081688947147793
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,32,8192,0.06407555606630114
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,32,4096,0.009095999929640029
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,32,7168,0.05506489011976454
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,32,3584,0.008285333712895712
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,32,6144,0.047545777426825635
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,32,3072,0.007252444823582967
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,32,5120,0.03948355714480082
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,32,2560,0.006622222148709827
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,32,4096,0.03389777739842733
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,32,2048,0.006030222194062338
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,32,3584,0.03080355458789402
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,32,1536,0.004929777648713854
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,32,3072,0.027698665857315063
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,32,1024,0.00424799985355801
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,32,2560,0.025408888856569927
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,32,768,0.0038968887594011095
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,32,2048,0.021967111362351313
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,64,64,0.0028737777223189673
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,32,1536,0.018928888771269057
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,32,256,0.003154666680428717
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,32,1024,0.015499555402331881
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,32,128,0.0028071111689011254
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,32,64,0.0028479999552170434
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,32,512,0.01309511148267322
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,32,256,0.012084444363911947
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,32,32,0.0028151110228565005
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,32,128,0.011740444435013665
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,32,64,0.011425777441925473
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,32,32,0.011424000064531961
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,32,10240,0.07795821958118014
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1025,32,512,0.0035137778355015647
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1025,32,768,0.014710222681363424
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,65536,16384,1.2015697691175673
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,65536,12288,0.8578817579481336
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,65536,16384,1.4908035066392686
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,65536,12288,1.0833173327975802
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,65536,10240,0.7057857513427734
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,65536,8192,0.6238257620069716
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,65536,10240,0.8941173553466797
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,65536,51200,3.821143256293403
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,65536,16384,1.3436720106336806
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,65536,7168,0.5447200139363607
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,65536,12288,0.9360444810655383
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,65536,8192,0.7202693091498481
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,65536,10240,0.802376005384657
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,65536,7168,0.6443795628017849
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,65536,6144,0.43055910534328884
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,65536,51200,5.027509477403429
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,65536,6144,0.5239351060655382
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,65536,8192,0.6344666481018066
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,65536,5120,0.35490579075283474
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,65536,4096,0.2859608862135145
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,65536,5120,0.4978826840718587
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,65536,4096,0.37617156240675187
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,65536,3584,0.2509182294209798
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,65536,6144,0.48685513602362734
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,65536,5120,0.4060408804151747
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,65536,3584,0.3202586703830295
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,65536,3072,0.23205688264634874
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,65536,7168,0.5609502262539333
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,65536,4096,0.3357128832075331
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,65536,2560,0.1803804503546821
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,65536,3072,0.28096532821655273
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,65536,3584,0.29887912008497447
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,65536,2560,0.26859821213616264
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,65536,1536,0.1328844494289822
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,65536,2048,0.1883466641108195
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,65536,3072,0.268887996673584
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,65536,2560,0.22680534256829155
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,65536,1024,0.07890844345092773
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,65536,2048,0.19209333260854086
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,65536,1536,0.1556560066011217
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,65536,1536,0.15283821688758
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,65536,768,0.07235733005735609
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,65536,512,0.05195555422041151
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,65536,1024,0.1192951069937812
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,65536,768,0.09417244460847642
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,65536,768,0.10361422432793511
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,65536,256,0.03569333420859443
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,65536,512,0.08114044533835517
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,65536,512,0.0855226649178399
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,65536,128,0.03176444437768724
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,65536,256,0.07023555702633329
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,65536,256,0.07510133584340413
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,65536,64,0.0269804447889328
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,65536,128,0.058499554793039955
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,65536,32,0.027433777848879497
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,65536,2048,0.15209600660536024
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,65536,64,0.06877422332763672
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,65536,128,0.0692382189962599
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,65536,32,0.068667557504442
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,65536,1024,0.1164062288072374
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,65536,51200,4.319367302788629
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,51200,16384,1.0190426508585613
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,51200,51200,3.1403901841905384
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,51200,65536,4.050179375542535
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,51200,51200,3.978246900770399
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,51200,12288,0.7138097551133898
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,51200,16384,1.206266615125868
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,51200,10240,0.5759244494967991
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,51200,65536,5.134314643012153
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,51200,12288,0.8487164709303113
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,51200,10240,0.7051848835415311
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,51200,8192,0.4869413375854492
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,51200,16384,1.0354080200195312
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,51200,8192,0.552188449435764
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,51200,12288,0.8008924590216743
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,51200,7168,0.4518124262491862
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,51200,7168,0.5091395378112793
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,51200,6144,0.3504622247483995
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,51200,10240,0.636007097032335
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,51200,6144,0.4839279916551378
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,51200,5120,0.2990017731984456
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,51200,7168,0.4550151295132107
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,51200,4096,0.2615191141764323
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,51200,5120,0.3904000123341878
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,51200,4096,0.2845066653357612
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,51200,6144,0.3925208780500624
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,51200,3584,0.23520533243815103
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,51200,5120,0.3355244530571832
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,51200,3584,0.2473075654771593
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,51200,3072,0.1900035540262858
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,51200,2560,0.15599200460645887
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,51200,8192,0.5117795732286241
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,51200,3584,0.24715020921495226
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,51200,4096,0.278801785575019
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,51200,3072,0.21541689501868355
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,51200,3072,0.22263201077779135
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,51200,2048,0.13360710938771567
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,51200,2560,0.21363288826412627
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,51200,1536,0.09863377941979302
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,51200,51200,3.505982293023003
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,51200,2048,0.15329689449734157
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,51200,1024,0.06876355409622192
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,51200,2560,0.18598133987850615
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,51200,768,0.052594665024015635
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,51200,1536,0.12260533703698052
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,51200,2048,0.1557528840170966
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,51200,1536,0.13299555248684353
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,51200,512,0.039239999320771955
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,51200,1024,0.10098399718602498
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,51200,256,0.028652442826165095
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,51200,768,0.08979466888639663
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,51200,1024,0.1012622250450982
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,51200,512,0.06668266985151503
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,51200,128,0.024655999408827886
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,51200,512,0.0748151143391927
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,51200,64,0.02251200046804216
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,51200,256,0.06026044156816271
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,51200,256,0.06051999992794461
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,51200,128,0.05033066537645128
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,51200,128,0.058733330832587353
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,51200,64,0.056758224964141846
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,51200,32,0.05688266621695625
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,51200,65536,4.462233649359809
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,51200,768,0.07657600111431546
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,16384,51200,1.001431147257487
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,51200,32,0.0229066660006841
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,16384,65536,1.3107484181722004
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,16384,16384,0.29449155595567494
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,16384,12288,0.25390667385525173
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,16384,16384,0.4535031318664551
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,16384,65536,1.8472124735514324
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,16384,51200,1.4272249009874132
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,16384,10240,0.22899288601345488
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,16384,16384,0.4435911178588867
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,16384,10240,0.26935378710428876
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,16384,12288,0.3384062184227838
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,16384,8192,0.21785777144961885
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,16384,10240,0.2799057695600721
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,16384,7168,0.14259644349416098
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,16384,8192,0.22891643312242296
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,16384,7168,0.18944444921281603
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,16384,6144,0.13534843921661377
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,16384,12288,0.3194391197628445
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,16384,7168,0.2040088839001126
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,16384,5120,0.09505066606733535
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,16384,6144,0.16496266259087458
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,16384,4096,0.07732533084021674
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,16384,6144,0.1784728897942437
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,16384,5120,0.1403955618540446
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,16384,8192,0.17713244756062826
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,16384,5120,0.15461333592732748
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,16384,3584,0.07618933253818087
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,16384,4096,0.11449866824679905
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,16384,4096,0.12842488288879395
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,16384,3072,0.061384002367655434
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,16384,65536,1.8367351955837672
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,16384,3584,0.10235999690161811
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,16384,2560,0.051496889856126576
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,16384,3584,0.1173964473936293
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,16384,2048,0.042895999219682485
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,16384,3072,0.10476089186138576
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,16384,3072,0.09046933386060928
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,16384,2560,0.08283733659320407
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,16384,1536,0.03658488723966811
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,16384,2560,0.0916702217525906
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,16384,1024,0.024381332927280005
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,16384,2048,0.07932533158196343
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,16384,2048,0.06586844391292997
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,16384,1536,0.053284443087048
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,16384,1536,0.07027733325958252
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,16384,768,0.020397333635224234
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,16384,1024,0.04042933384577433
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,16384,512,0.015784889459609985
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,16384,1024,0.054435554477903575
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,16384,256,0.012599999705950419
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,16384,768,0.048691554201973804
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,16384,768,0.03433955709139506
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,16384,128,0.010400888820489248
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,16384,512,0.042075554529825844
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,16384,256,0.03609688745604621
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,16384,64,0.00925244473748737
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,16384,32,0.009298666483826106
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,16384,128,0.025035555164019268
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,16384,64,0.025027554896142747
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,16384,32,0.024381332927280005
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,16384,51200,1.4223599963717992
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,12288,65536,0.8900453779432508
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,16384,512,0.028704888290829126
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,16384,256,0.025754666990704004
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,16384,128,0.03120533294147915
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,12288,51200,0.7312791082594129
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,12288,16384,0.2549591064453125
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,12288,65536,1.5046880510118272
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,12288,12288,0.1895537773768107
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,12288,16384,0.3519759972890218
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,12288,10240,0.14548267258538142
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,12288,12288,0.2608933448791504
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,12288,16384,0.4149191114637587
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,12288,10240,0.21669067276848686
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,12288,51200,1.187944836086697
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,12288,12288,0.306534210840861
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,12288,8192,0.1361866659588284
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,12288,7168,0.11947555012173122
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,12288,8192,0.17506399419572619
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,12288,6144,0.09989066918690999
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,12288,7168,0.15541156133015951
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,12288,10240,0.2544773419698079
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,12288,8192,0.20719644758436415
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,12288,5120,0.08186666833029853
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,12288,7168,0.186591108640035
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,12288,6144,0.13488533761766222
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,12288,4096,0.06047111087375217
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,12288,6144,0.16862311628129747
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,12288,5120,0.11645866764916314
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,12288,5120,0.14006666342417398
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,12288,4096,0.09583822223875259
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,12288,3072,0.0546960002846188
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,12288,4096,0.11733867062462701
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,12288,2560,0.04425866736306084
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,12288,3584,0.08626933230294122
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,12288,3584,0.10668355226516724
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,12288,3072,0.0756817791197035
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,12288,2048,0.03323555654949612
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,12288,3072,0.09617866410149468
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,12288,1536,0.028130667077170476
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,12288,2560,0.06589600112703112
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,12288,51200,1.2437591552734375
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,12288,2048,0.05429244372579786
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,12288,2048,0.07226400242911445
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,12288,1024,0.020403555697864957
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,12288,768,0.016647110382715862
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,12288,1536,0.06237955225838555
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,12288,1536,0.044300443596310086
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,12288,512,0.012530666258600024
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,12288,1024,0.0502017769548628
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,12288,768,0.029909332593282063
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,12288,768,0.04468977782461378
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,12288,256,0.012167111039161682
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,12288,512,0.03810844487614102
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,12288,512,0.025063999825053748
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,12288,128,0.01036177741156684
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,12288,256,0.03252799974547492
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,12288,256,0.02235288918018341
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,12288,64,0.009941333697901832
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,12288,128,0.021747555997636583
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,12288,32,0.007928888830873702
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,12288,128,0.028868443436092798
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,12288,3584,0.05386311146948072
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,12288,64,0.02164977788925171
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,12288,32,0.021271111236678228
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,12288,65536,1.589005364312066
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,12288,2560,0.08552000257703994
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,10240,51200,0.5975511338975694
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,10240,65536,0.8020390934414334
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,12288,1024,0.0344453321562873
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,10240,16384,0.21217689249250624
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,10240,51200,1.0364809036254883
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,10240,12288,0.1602284378475613
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,10240,16384,0.33241955439249676
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,10240,65536,1.3178880479600694
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,10240,10240,0.13911555873023138
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,10240,16384,0.36582310994466144
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,10240,10240,0.19326755735609266
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,10240,8192,0.13074044386545816
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,10240,12288,0.28305066956414116
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,10240,10240,0.23413422372606066
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,10240,7168,0.10274489058388604
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,10240,8192,0.1562159988615248
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,10240,8192,0.18968533145056832
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,10240,6144,0.08027555545171101
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,10240,7168,0.14025155703226724
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,10240,7168,0.17099555333455405
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,10240,5120,0.07557066943910387
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,10240,6144,0.12081866794162327
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,10240,51200,1.1282640033298068
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,10240,4096,0.0643084446589152
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,10240,6144,0.1482879983054267
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,10240,5120,0.10416266653272842
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,10240,5120,0.12912089294857448
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,10240,3584,0.05228799912664625
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,10240,65536,1.4357769224378798
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,10240,4096,0.08699911170535618
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,10240,3072,0.047930667797724404
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,10240,4096,0.10820621914333767
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,10240,2560,0.03695199886957804
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,10240,3584,0.07794133159849378
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,10240,12288,0.23042755656772188
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,10240,3584,0.09892444478140937
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,10240,2048,0.031424889961878456
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,10240,3072,0.08867466449737549
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,10240,3072,0.06976711087756686
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,10240,2560,0.05942577785915799
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,10240,2560,0.07748799853854708
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,10240,1024,0.017658667431937326
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,10240,2048,0.06683378087149726
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,10240,2048,0.0483493341339959
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,10240,768,0.014476444986131458
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,10240,1536,0.05925244755215115
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,10240,1536,0.04054666558901469
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,10240,1024,0.031211555004119873
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,10240,512,0.011711111499203576
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,10240,256,0.008714666797055138
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,10240,768,0.026406221919589575
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,10240,768,0.041328890456093684
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,10240,128,0.0074924445814556545
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,10240,512,0.022634666826989915
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,10240,512,0.037263999382654824
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,10240,64,0.008616888688670265
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,10240,256,0.03070311082734002
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,10240,256,0.020651555723614164
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,10240,32,0.008608000146018134
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,10240,128,0.020230222079488967
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,10240,64,0.019904888338512845
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,10240,32,0.019904888338512845
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,8192,65536,0.5917893515692817
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,8192,51200,0.4643404218885634
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,10240,1536,0.02461244497034285
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,8192,16384,0.1700026724073622
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,10240,1024,0.04677333434422811
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,8192,16384,0.27636533313327366
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,8192,12288,0.13163467248280844
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,8192,65536,1.1521502600775826
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,10240,128,0.027071999178992376
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,8192,10240,0.10690666569603814
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,8192,51200,0.8980844285753039
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,8192,8192,0.08870044681761001
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,8192,16384,0.33999911944071454
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,8192,10240,0.1688471105363634
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,8192,12288,0.24857955508761934
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,8192,7168,0.08250844478607178
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,8192,10240,0.20944621827867296
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,8192,8192,0.1367502212524414
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,8192,7168,0.12149333953857422
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,8192,6144,0.06881688700781928
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,8192,8192,0.17452088991800943
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,8192,5120,0.050847109821107656
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,8192,7168,0.15468000041113958
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,8192,6144,0.10611822207768758
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,8192,6144,0.13506933053334555
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,8192,5120,0.09098222520616318
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,8192,4096,0.04416799876425001
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,8192,3584,0.04012889001104567
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,8192,5120,0.11775999599032932
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,8192,65536,1.2973528967963326
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,8192,4096,0.09873244497511123
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,8192,3072,0.03707199957635667
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,8192,51200,1.0108871459960938
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,8192,3584,0.06748800145255195
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,8192,2560,0.029888000753190782
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,8192,3072,0.059537774986690946
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,8192,3072,0.08155200216505262
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,8192,12288,0.20197510719299316
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,8192,2048,0.02479822271400028
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,8192,2560,0.051543109946780734
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,8192,2560,0.07181511322657268
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,8192,1536,0.020094222492641874
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,8192,1024,0.014967110421922473
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,8192,2048,0.061271111170450844
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,8192,2048,0.04311466548177931
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,8192,1536,0.03604799840185378
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,8192,1024,0.027515555421511333
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,8192,1024,0.04344800114631653
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,8192,512,0.009686222506894005
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,8192,768,0.023933332827356126
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,8192,768,0.03771911064783732
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,8192,256,0.007320889168315464
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,8192,512,0.0207004447778066
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,8192,512,0.033281776640150286
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,8192,128,0.007785778078767989
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,8192,256,0.018930666976504855
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,8192,256,0.029492444462246362
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,8192,64,0.007289778027269576
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,8192,128,0.018254222141371835
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,8192,128,0.026520000563727483
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,8192,32,0.007540444533030192
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,8192,4096,0.07484977775149874
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,8192,64,0.018218666315078735
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,8192,3584,0.09001421928405762
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,8192,32,0.01824711097611321
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,8192,1536,0.05379822187953525
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,7168,65536,0.5808017518785265
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,7168,51200,0.4880666732788086
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,7168,16384,0.16494222482045492
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,7168,16384,0.29721956782870823
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,7168,51200,0.825742244720459
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,7168,65536,1.056863996717665
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,7168,12288,0.12440710597568089
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,7168,10240,0.1092462208535936
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,7168,12288,0.1881564458211263
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,7168,16384,0.33348978890313047
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,7168,8192,0.08859111203087701
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,7168,12288,0.24629510773552787
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,7168,10240,0.16440533267127141
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,7168,10240,0.20812977684868705
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,8192,768,0.012544000314341651
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,7168,8192,0.12915644380781385
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,7168,8192,0.17033510737948945
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,7168,6144,0.06382311052746244
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,7168,7168,0.11454399426778157
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,7168,7168,0.15297067165374756
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,7168,65536,1.2777990765041776
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,7168,6144,0.10158310996161567
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,7168,5120,0.05295288893911573
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,7168,51200,1.0042977862887912
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,7168,4096,0.0437448885705736
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,7168,3584,0.03913155529234145
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,7168,5120,0.08665955728954738
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,7168,4096,0.07227022118038602
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,7168,5120,0.1162159972720676
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,7168,4096,0.09718755880991618
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,7168,3072,0.03393777873780992
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,7168,2560,0.02942488922013177
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,7168,3584,0.06217777729034424
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,7168,3584,0.0886382195684645
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,7168,3072,0.056406219800313316
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,7168,3072,0.07984977960586548
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,7168,2048,0.02495288848876953
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,7168,1536,0.020145777199003432
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,7168,2560,0.04909866717126635
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,7168,2560,0.07114311059315999
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,7168,1024,0.015478221906556023
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,7168,2048,0.06055111355251736
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,7168,2048,0.04083555605676439
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,7168,768,0.013010666602187686
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,7168,1536,0.05300800005594889
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,7168,512,0.009695111049546136
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,7168,1024,0.0262097782558865
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,7168,7168,0.07714044385486178
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,7168,768,0.03719910979270935
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,7168,256,0.007627555893527136
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,7168,512,0.0332568883895874
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,7168,512,0.0199991116921107
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,7168,128,0.006240889016124938
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,7168,256,0.028326223293940227
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,7168,256,0.018018666240904067
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,7168,64,0.007310222420427535
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,7168,128,0.017870222528775532
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,7168,128,0.026230222649044458
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,7168,32,0.010000000397364298
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,7168,6144,0.13347910510169134
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,7168,64,0.017281777328915067
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,7168,32,0.01721955504682329
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,6144,65536,0.44556713104248047
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,6144,51200,0.350383996963501
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,7168,1536,0.034289777278900146
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,7168,1024,0.04238311118549771
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,7168,768,0.023002665903833177
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,6144,16384,0.11985333760579427
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,6144,12288,0.09035378032260472
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,6144,16384,0.23285155826144746
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,6144,51200,0.765685346391466
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,6144,12288,0.17470222049289277
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,6144,16384,0.29380978478325737
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,6144,10240,0.0892675585216946
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,6144,12288,0.22148444917466906
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,6144,8192,0.06904266940222846
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,6144,10240,0.14701422055562338
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,6144,10240,0.18681600358751085
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,6144,7168,0.0657600031958686
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,6144,8192,0.11929333209991455
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,6144,65536,1.1418942345513237
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,6144,8192,0.15426933765411377
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,6144,6144,0.055536889367633395
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,6144,5120,0.04382044408056471
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,6144,7168,0.13804622491200766
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,6144,6144,0.12168444527520074
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,6144,6144,0.09405510955386692
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,6144,4096,0.038047999143600464
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,6144,5120,0.08054133256276448
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,6144,5120,0.10604977607727051
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,6144,65536,0.9698844485812717
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,6144,3584,0.03322044346067641
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,6144,4096,0.0646488865216573
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,6144,3072,0.028784000211291846
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,6144,4096,0.08871377838982476
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,6144,2560,0.024663110574086506
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,6144,3584,0.0581644442346361
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,6144,3584,0.08132266336017184
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,6144,2048,0.02130399975511763
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,6144,3072,0.07376977470186022
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,6144,2560,0.06583555539449056
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,6144,1536,0.015492444237073263
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,6144,2048,0.038098666403028704
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,6144,1536,0.032037334309683904
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,6144,1536,0.04960888955328199
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,6144,1024,0.012372444073359171
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,6144,1024,0.02437155610985226
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,6144,1024,0.03939555419815911
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,6144,768,0.010709332923094431
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,6144,7168,0.10741244422064887
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,6144,51200,0.8995342254638672
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,6144,512,0.00867555538813273
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,6144,768,0.03513955407672458
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,6144,768,0.021669333179791767
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,6144,256,0.007308444215191736
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,6144,512,0.03281689021322463
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,6144,512,0.0188737776544359
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,6144,128,0.00656444455186526
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,6144,256,0.017217778497272067
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,6144,256,0.028093334701326158
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,6144,64,0.00628977765639623
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,6144,32,0.006585777633719974
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,6144,128,0.025056888659795124
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,6144,128,0.01683288812637329
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,6144,64,0.016561778055297006
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,6144,3072,0.05078044533729553
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,6144,32,0.016200888488027785
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,6144,2560,0.045258667733934194
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,6144,2048,0.05632355478074816
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,5120,16384,0.1120106644100613
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,5120,65536,0.40406134393480087
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,5120,51200,0.32164978981018066
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,5120,12288,0.08652533425225152
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,5120,16384,0.2171351114908854
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,5120,10240,0.06910133361816406
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,5120,12288,0.1759208838144938
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,5120,16384,0.29156443807813853
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,5120,51200,0.7012115584479438
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,5120,65536,0.8967475891113281
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,5120,8192,0.05827555391523573
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,5120,10240,0.13381066587236193
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,5120,7168,0.04935822221967909
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,5120,8192,0.10988266600502862
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,5120,10240,0.19015288352966309
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,5120,8192,0.15266222423977321
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,5120,7168,0.09792444441053604
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,5120,7168,0.13721956147087946
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,5120,5120,0.03449511196878221
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,5120,6144,0.08694666624069214
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,5120,6144,0.12067822615305583
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,5120,4096,0.02919911013709174
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,5120,51200,0.8915849261813693
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,5120,5120,0.07374399900436401
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,5120,5120,0.10461066828833686
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,5120,3584,0.02754844393995073
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,5120,3072,0.02457422183619605
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,5120,4096,0.0889973309304979
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,5120,4096,0.05870933002895779
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,5120,3584,0.0811777777141995
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,5120,65536,1.1312630971272786
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,5120,2560,0.019457777341206867
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,5120,3072,0.07258488734563191
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,5120,2048,0.01665155589580536
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,5120,2560,0.04178933302561442
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,5120,2560,0.06489066945181952
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,5120,1536,0.013588444226317935
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,5120,2048,0.03529777791765001
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,5120,2048,0.05572266711129082
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,5120,12288,0.23307998975118002
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,5120,1024,0.010047111246320937
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,5120,1536,0.029492444462246362
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,5120,768,0.008718222379684448
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,5120,1536,0.048772444327672325
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,5120,1024,0.03804622093836466
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,5120,1024,0.02256444427702162
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,5120,512,0.0069644442862934535
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,5120,6144,0.04043644335534837
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,5120,768,0.03434044453832839
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,5120,256,0.005944889038801193
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,5120,512,0.01774044500456916
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,5120,512,0.030986666679382324
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,5120,128,0.005541333307822545
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,5120,256,0.027764444549878437
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,5120,256,0.01648977730009291
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,5120,64,0.005256888767083486
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,5120,32,0.005221333354711533
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,5120,128,0.024700444605615404
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,5120,128,0.015855110353893705
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,5120,64,0.015815999772813585
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,5120,32,0.015455999308162265
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,5120,3584,0.05283733208974203
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,5120,3072,0.04708622230423821
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,4096,65536,0.32802311579386395
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,4096,51200,0.25920534133911133
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,4096,16384,0.08941600057813857
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,4096,16384,0.20818755361768934
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,4096,65536,0.8043742179870605
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,4096,12288,0.06581244203779432
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,4096,51200,0.6345280011494955
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,4096,16384,0.2719208929273817
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,5120,768,0.02040088839001126
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,4096,10240,0.05793155564202202
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,4096,8192,0.042747557163238525
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,4096,12288,0.1466719971762763
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,4096,10240,0.12415466043684219
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,4096,10240,0.16416445043351915
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,4096,7168,0.04045777850680881
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,4096,8192,0.09946578078799778
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,4096,8192,0.13662666744656032
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,4096,6144,0.03383288780848185
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,4096,7168,0.08919111225340103
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,4096,51200,0.7862844467163086
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,4096,7168,0.1241048839357164
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,4096,5120,0.02954044606950548
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,4096,65536,0.998194694519043
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,4096,4096,0.02461333407296075
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,4096,6144,0.10754933622148301
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,4096,6144,0.07844977908664279
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,4096,3584,0.022150221798155043
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,4096,5120,0.09405955341127183
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,4096,5120,0.06658222277959187
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,4096,3072,0.020270221763186984
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,4096,4096,0.07902577850553724
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,4096,4096,0.05368444323539734
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,4096,2560,0.01774488886197408
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,4096,3584,0.04790488878885905
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,4096,3584,0.07267289029227363
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,4096,2048,0.015233778291278414
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,4096,3072,0.06571911440955268
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,4096,3072,0.04286400145954556
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,4096,2560,0.0381368895371755
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,4096,2560,0.058873779243893094
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,4096,1536,0.01257155587275823
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,4096,1024,0.009753777749008602
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,4096,2048,0.03224622209866842
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,4096,2048,0.051220443513658315
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,4096,768,0.008459555606047312
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,4096,1536,0.04483822319242689
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,4096,1536,0.02680177821053399
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,4096,1024,0.020917332834667627
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,4096,512,0.006603555546866522
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,4096,1024,0.03526755505137973
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,4096,256,0.005724444571468566
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,4096,768,0.018911111685964797
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,4096,768,0.03258488906754388
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,4096,128,0.00519466648499171
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,4096,512,0.01683822274208069
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,4096,512,0.029545777373843726
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,4096,64,0.004596444467703502
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,4096,256,0.015805333852767944
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,4096,256,0.027458666099442378
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,4096,12288,0.19578044944339326
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,4096,32,0.00488800017370118
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,4096,128,0.015312888556056552
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,4096,128,0.024215110474162634
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,4096,64,0.015134221977657743
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,4096,32,0.01514488955338796
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,3584,51200,0.2331991195678711
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,3584,65536,0.3064648840162489
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,3584,16384,0.08591822120878433
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,3584,16384,0.1924213303460015
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,3584,51200,0.6105448934766982
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,3584,12288,0.06518577867084079
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,3584,65536,0.7825146781073676
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,3584,10240,0.05415111117892795
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,3584,12288,0.14112888442145452
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,3584,12288,0.19630222850375703
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,3584,8192,0.042456888490253024
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,3584,10240,0.11865866184234619
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,3584,51200,0.779546684688992
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,3584,7168,0.038198222716649376
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,3584,8192,0.09804711076948379
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,3584,65536,0.9958284166124133
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,3584,6144,0.033927109506395124
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,3584,7168,0.12110755178663467
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,3584,7168,0.08736355437172784
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,3584,5120,0.029448890023761328
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,3584,6144,0.10716978046629165
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,3584,6144,0.07692088683446248
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,3584,4096,0.024417777856190998
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,3584,5120,0.06504888667000665
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,3584,5120,0.09316533141665989
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,3584,3584,0.0229093333085378
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,3584,4096,0.07856622007158068
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,3584,3072,0.019997333486874897
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,3584,3584,0.07238755623499553
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,3584,16384,0.25689244270324707
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,3584,2560,0.01761155492729611
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,3584,3072,0.04208799865510729
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,3584,3072,0.06571822033988105
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,3584,2048,0.015356444650226168
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,3584,2560,0.03728888763321771
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,3584,2048,0.03187377916442023
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,3584,2048,0.05096355411741468
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,3584,1536,0.012847999731699625
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,3584,10240,0.1636106703016493
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,3584,1024,0.009646221995353699
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,3584,8192,0.13636799653371176
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,3584,1536,0.044334222873051964
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,3584,1536,0.026165333059098985
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,3584,768,0.008309333688682979
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,3584,1024,0.020569778150982328
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,3584,1024,0.035162667433420815
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,3584,512,0.006656000183688269
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,3584,768,0.032159109910329185
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,3584,768,0.018572444717089336
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,3584,256,0.005600000007285013
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,3584,512,0.01616533266173469
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,3584,256,0.015465777781274585
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,3584,128,0.005223999834722943
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,3584,256,0.02658044464058346
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,3584,64,0.004610666798220741
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,3584,3584,0.04685599936379326
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,3584,128,0.024089778463045757
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,3584,128,0.014898666077189975
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,3584,32,0.0052826665341854095
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,3584,64,0.01480977733929952
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,3584,32,0.014430221584108142
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,3072,65536,0.2494373321533203
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,3584,2560,0.05832711193296644
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,3072,51200,0.21881066428290474
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,3072,16384,0.07324533330069648
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,3072,65536,0.7375306553310819
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,3072,16384,0.18518666426340738
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,3072,12288,0.052684442864524
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,3072,51200,0.5786506864759657
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,3584,512,0.029504001140594482
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,3072,10240,0.045887112617492676
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,3584,4096,0.052784889936447144
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,3072,12288,0.13668089442782932
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,3072,12288,0.19194932778676352
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,3072,8192,0.03746577766206529
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,3072,10240,0.1128773291905721
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,3072,7168,0.03209866748915778
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,3072,10240,0.16298222541809082
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,3072,51200,0.7795022328694662
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,3072,65536,0.9849270714653863
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,3072,8192,0.09325066539976333
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,3072,6144,0.028597331709331934
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,3072,8192,0.13510221905178493
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,3072,7168,0.08279377884334989
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,3072,7168,0.12070133950975205
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,3072,6144,0.10664444499545628
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,3072,4096,0.020629333125220407
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,3072,5120,0.061182220776875816
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,3072,3584,0.018395556343926322
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,3072,5120,0.09244266483518813
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,3072,3072,0.016618667377365958
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,3072,4096,0.049568000766966075
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,3072,4096,0.07821955283482869
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,3072,3584,0.07175822390450372
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,3072,3584,0.04458489020665487
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,3072,2560,0.01464355488618215
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,3072,2048,0.012800888882742988
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,3072,3072,0.040413333310021296
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,3072,3072,0.06475289000405206
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,3072,2560,0.05794399976730347
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,3072,2560,0.03569688730769687
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,3072,1536,0.010034666293197209
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,3072,2048,0.030517333083682593
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,3072,2048,0.04867022236188253
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,3072,1024,0.0076453329788313965
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,3072,1536,0.043603556023703686
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,3072,768,0.00655733338660664
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,3072,1024,0.019934222102165222
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,3072,16384,0.25496800740559894
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,3072,512,0.005879999862776862
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,3072,768,0.032229334115982056
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,3072,768,0.017910222212473553
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,3072,256,0.0052133335007561584
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,3072,512,0.015800888339678448
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,3072,512,0.02946044339074029
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,3072,5120,0.024546666277779475
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,3072,128,0.004223111189073986
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,3072,256,0.014768888552983602
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,3072,64,0.004201777693298128
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,3072,6144,0.07244088914659289
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,3072,128,0.023846222294701472
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,3072,32,0.0041999999019834726
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,3072,128,0.0144533332851198
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,3072,64,0.014084445105658637
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,3072,32,0.014025777578353882
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,2560,65536,0.19061866071489122
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,2560,51200,0.18402932749854195
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,3072,1536,0.02490666674243079
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,3072,1024,0.03528889020284017
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,2560,16384,0.05379822187953525
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,2560,65536,0.6946986516316732
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,2560,51200,0.5415973133511013
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,2560,12288,0.0439297788672977
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,2560,16384,0.17311733298831514
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,2560,10240,0.034747554196251765
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,2560,16384,0.2538702223036024
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,2560,12288,0.1268764469358656
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,2560,12288,0.1915688912073771
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,3072,256,0.02604266670015123
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,2560,10240,0.10673689179950291
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,2560,10240,0.16211822297838
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,2560,7168,0.025087111526065405
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,2560,65536,0.9836062325371636
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,2560,8192,0.08816533618503147
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,2560,8192,0.13326756159464517
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,2560,51200,0.7816942003038195
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,2560,6144,0.023583999938435022
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,2560,5120,0.01973600023322635
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,2560,7168,0.07826933595869276
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,2560,7168,0.11947733826107448
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,2560,6144,0.06793955299589369
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,2560,4096,0.01601777805222405
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,2560,6144,0.10566311412387425
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,2560,5120,0.058127111858791776
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,2560,3584,0.01475644442770216
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,2560,5120,0.09217955668767293
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,2560,3072,0.013325333595275879
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,2560,4096,0.07755555709203084
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,2560,4096,0.04690577917628818
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,2560,2560,0.012311999996503195
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,2560,3584,0.04203200009134081
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,2560,3584,0.07159111234876844
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,2560,2048,0.010442666709423065
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,2560,3072,0.03775733378198411
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,2560,1536,0.008254222571849823
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,2560,3072,0.0648239983452691
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,2560,2560,0.057576000690460205
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,2560,2560,0.03300177719857957
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,2560,2048,0.04874577787187365
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,2560,1536,0.04195733202828301
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,2560,768,0.0058959999846087555
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,2560,1536,0.023716444770495098
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,2560,1024,0.03492710987726847
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,2560,512,0.005199999858935674
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,2560,1024,0.01924533314175076
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,2560,256,0.004515555583768421
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,2560,768,0.03184266553984748
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,2560,768,0.017162667380438913
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,2560,512,0.029162665208180744
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,2560,128,0.0041582224269707995
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,2560,512,0.015493333339691162
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,2560,64,0.0038355555799272326
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,2560,8192,0.02920177910063002
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,2560,256,0.025755556093321905
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,2560,256,0.014464888307783337
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,2560,32,0.003842666745185852
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,2560,128,0.02382755610677931
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,2560,128,0.014093332820468478
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,2560,64,0.01346933344999949
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,2560,32,0.013454222016864352
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,2048,65536,0.19782043827904594
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,2048,51200,0.14431733555263943
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,2048,16384,0.05108888943990072
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,2048,16384,0.16274489296807185
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,2048,12288,0.038402666648228966
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,2048,16384,0.21964444054497612
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,2048,51200,0.5107866923014323
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,2048,65536,0.6499048868815104
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,2560,1024,0.006934222247865465
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,2560,2048,0.027756444282001917
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,2048,12288,0.11924533049265544
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,2048,12288,0.16528799798753527
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,2048,8192,0.02457511093881395
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,2048,10240,0.09986755583021377
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,2048,51200,0.6666017638312446
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,2048,7168,0.021644444929228887
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,2048,10240,0.1407839987013075
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,2048,65536,0.8458035786946615
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,2048,8192,0.08196889029608832
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,2048,8192,0.11653155750698513
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,2048,5120,0.017320889565679762
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,2048,7168,0.10475999779171413
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,2048,7168,0.07322221994400024
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,2048,4096,0.014919110470347934
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,2048,6144,0.06348266866472033
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,2048,6144,0.09277866946326362
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,2048,5120,0.05289777782228258
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,2048,5120,0.0810862249798245
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,2048,4096,0.04372088776694404
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,2048,3072,0.012346666720178394
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,2048,3584,0.03992444607946608
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,2048,3584,0.0634488860766093
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,2048,2560,0.01070666644308302
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,2048,3072,0.03532355692651536
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,2048,3072,0.05716355641682943
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,2048,2048,0.009295110901196798
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,2048,2560,0.031714667876561485
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,2048,2560,0.05044000016318428
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,2048,10240,0.03209155466821458
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,2048,1536,0.007655999726719326
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,2048,2048,0.027091556125217017
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,2048,2048,0.04321066538492838
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,2048,1024,0.006228444476922353
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,2048,1536,0.038226667377683855
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,2048,1536,0.022653333014912073
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,2048,768,0.005601777798599667
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,2048,1024,0.03222222129503886
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,2048,512,0.004819555415047539
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,2048,6144,0.01975288821591271
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,2048,768,0.029496888319651287
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,2048,256,0.004171555654870139
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,2048,512,0.014952888091405233
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,2048,512,0.027093332674768236
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,2048,128,0.0038337777886125776
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,2048,3584,0.013552889227867126
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,2048,256,0.025088000628683303
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,2048,64,0.003629333443111844
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,2048,128,0.013409777647919126
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,2048,128,0.022675555613305833
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,2048,32,0.0035333335399627686
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,2048,64,0.013435555828942193
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,1536,65536,0.1468248897128635
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,2048,32,0.013433777623706393
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,1536,51200,0.12354311678144668
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,2048,1024,0.01824977828396691
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,1536,65536,0.6089830928378636
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,2048,768,0.016492444607946608
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,1536,16384,0.038831998904546104
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,1536,51200,0.4760577943589952
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,1536,12288,0.029418667157491047
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,2048,256,0.013756444056828817
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,1536,16384,0.15403910477956137
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,1536,16384,0.21858844492170545
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,1536,12288,0.11179910765753852
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,1536,65536,0.8421902126736112
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,1536,8192,0.020277332928445604
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,1536,12288,0.16529866059621176
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,1536,10240,0.09386666615804036
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,1536,10240,0.13997244834899902
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,1536,7168,0.018010665973027546
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,1536,51200,0.6620320214165581
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,1536,8192,0.11603111690945095
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,1536,6144,0.016216889023780823
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,1536,7168,0.06838399834103055
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,1536,7168,0.10378844208187527
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,1536,5120,0.01423466702302297
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,1536,6144,0.09211555454466079
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,1536,6144,0.05917155742645264
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,1536,4096,0.012305777933862476
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,1536,5120,0.04986133178075155
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,1536,5120,0.08077066474490695
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,1536,3584,0.011076444553004371
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,1536,4096,0.041109333435694374
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,1536,4096,0.06821066803402372
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,1536,3072,0.010031110710567897
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,1536,3584,0.03705155518319871
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,1536,3584,0.06311644448174371
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,1536,2560,0.00922400007645289
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,1536,3072,0.03342933456103007
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,1536,2048,0.007963555554548899
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,1536,3072,0.055517332421408765
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,1536,1536,0.0069439998931354946
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,1536,2560,0.05084000031153361
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,1536,2560,0.030047112041049536
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,1536,10240,0.02426311042573717
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,1536,2048,0.04253244400024414
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,1536,2048,0.025047999289300706
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,1536,768,0.004975111120276981
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,1536,1536,0.021553777986102637
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,1536,1024,0.0319164428446028
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,1536,1024,0.017440888616773818
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,1536,512,0.004576888763242298
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,1536,768,0.015861334072219003
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,1536,768,0.029162665208180744
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,1536,8192,0.07655111286375257
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,1536,256,0.004190222256713443
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,1536,512,0.014418666561444601
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,1536,128,0.004062222109900581
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,1536,256,0.013421333498424955
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,1536,256,0.023706666297382776
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,1536,64,0.003846222327815162
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,1536,128,0.013085333009560903
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,1536,128,0.02163022259871165
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,1536,32,0.0039013334446483185
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,1536,64,0.012732444538010491
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,1024,65536,0.10719377464718288
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,1536,32,0.01274400038851632
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,1024,51200,0.08051288790173002
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,1536,1024,0.005535999933878581
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,2048,4096,0.06913422213660346
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,1024,16384,0.03215822246339586
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,1536,1536,0.03803199860784743
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,1024,65536,0.5620906617906358
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,1024,12288,0.024541333317756653
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,1024,51200,0.44295377201504177
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,1024,16384,0.13821778032514784
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,1024,16384,0.21526755226982963
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,1024,10240,0.021129777034123737
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,1024,12288,0.10343644354078506
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,1024,12288,0.16161689493391249
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,1024,8192,0.017553778158293832
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,1024,65536,0.8264924685160319
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,1024,7168,0.016410667035314772
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,1024,10240,0.08690310849083795
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,1024,10240,0.13727200031280518
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,1024,6144,0.014083556003040738
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,1024,51200,0.6508408652411567
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,1024,8192,0.07110577821731567
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,1024,5120,0.012277333272827996
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,1024,7168,0.06297777758704291
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,1024,7168,0.10244977474212646
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,1024,4096,0.010584889186753167
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,1024,6144,0.05372711022694906
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,1024,5120,0.04591022266281975
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,1024,5120,0.07903110980987549
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,1024,3584,0.009650666680600908
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,1024,4096,0.037667555941475764
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,1024,3072,0.008665777742862701
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,1024,3584,0.06227022409439087
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,1024,3584,0.033935109774271645
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,1024,2560,0.008001777860853408
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,1024,3072,0.030513776673210993
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,1024,3072,0.05625155236985949
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,1024,2048,0.006934222247865465
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,1024,2560,0.027310222387313843
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,1024,2560,0.049089776145087353
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,1024,1536,0.006462222172154321
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,1536,512,0.0273973329199685
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,1024,2048,0.023316444622145757
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,1024,2048,0.04234133495224846
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,1024,1024,0.005203555441564984
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,1024,1536,0.0377111103799608
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,1024,1536,0.020304888486862183
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,1024,768,0.004571555389298333
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,1024,1024,0.016544888416926067
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,1024,1024,0.03162399927775065
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,1024,512,0.003944000022278892
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,1024,8192,0.11419378386603461
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,1024,768,0.028813332319259644
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,1024,256,0.003847111016511917
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,1024,512,0.013776889277829064
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,1024,512,0.026957333087921143
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,1024,128,0.00351200004418691
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,1024,6144,0.09025688966115315
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,1024,256,0.024745777249336243
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,1024,256,0.013069333301650153
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,1024,64,0.0032248888164758682
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,1024,32,0.003165333428316646
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,1024,128,0.012453333371215396
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,1024,128,0.02144355575243632
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,1024,4096,0.06700888607237074
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,1024,64,0.012233778006500669
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,768,65536,0.08902400069766575
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,1024,32,0.012453333371215396
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,768,51200,0.07055289215511747
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,768,16384,0.14116622342003718
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,768,51200,0.4382755491468642
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,768,12288,0.019885333047972787
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,768,16384,0.21412711673312715
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,768,51200,0.6475520133972168
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,768,12288,0.10235644711388482
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,768,65536,0.823069307539198
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,1024,768,0.015277332729763456
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,768,8192,0.014564444621404013
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,768,12288,0.16092711024814182
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,768,7168,0.013376889129479727
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,768,10240,0.08632444673114353
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,768,10240,0.13716533448961046
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,768,8192,0.07140977515114678
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,768,6144,0.011756444142924415
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,768,8192,0.11356000105539958
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,768,7168,0.06217866473727756
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,768,7168,0.10241511132982041
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,768,5120,0.010336000058386061
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,768,6144,0.053293334113227
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,768,16384,0.02609511050913069
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,768,6144,0.09013866715961033
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,768,4096,0.009031111167536842
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,768,3584,0.008078222473462423
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,768,5120,0.045087112320793994
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,768,5120,0.07857600185606214
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,768,4096,0.06750400198830499
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,768,4096,0.03706577751371596
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,768,3072,0.007626666790909237
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,768,3584,0.03327466713057624
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,768,2560,0.006903999795516332
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,768,65536,0.5580595334370931
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,768,2048,0.005943111247486538
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,768,3072,0.05602577659818861
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,768,3072,0.03120533294147915
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,768,2560,0.048400001393424145
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,768,2560,0.02700000007947286
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,768,1536,0.005571555760171678
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,768,1024,0.004588444613748127
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,768,2048,0.02366311185889774
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,768,2048,0.042266666889190674
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,768,1536,0.03735377722316318
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,768,1536,0.020071999894248117
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,768,10240,0.017129777206314933
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,768,512,0.003871110992299186
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,768,1024,0.016534222496880423
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,768,1024,0.031290666924582586
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,768,256,0.0035031110876136353
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,768,768,0.014833778142929077
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,768,512,0.013803555733627744
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,768,512,0.026748443643252056
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,768,128,0.003168888803985384
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,768,256,0.012728888955381183
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,768,256,0.023299554983774822
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,768,64,0.0031831111345026228
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,768,128,0.022272888157102797
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,768,128,0.012764444781674279
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,768,32,0.003564444267087512
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,768,64,0.012103999654452005
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,512,65536,0.05620888868967692
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,768,32,0.012426666915416718
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,512,51200,0.04566577739185757
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,768,3584,0.06015021933449639
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,512,16384,0.019159111711714003
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,512,65536,0.5171884430779351
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,512,51200,0.4063093397352431
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,512,12288,0.018358222312397428
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,768,768,0.004519111166397731
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,512,16384,0.21354311042361787
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,512,51200,0.6457582049899632
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,768,768,0.028757333755493164
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,512,10240,0.01660977800687154
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,512,12288,0.09519200192557441
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,512,65536,0.8191786872016059
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,512,8192,0.0141004439857271
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,512,7168,0.012687111066447364
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,512,12288,0.1608862214618259
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,512,10240,0.07934755749172635
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,512,10240,0.13607111242082384
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,512,6144,0.011065777805116443
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,512,8192,0.06482666730880737
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,512,8192,0.11329066753387451
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,512,7168,0.05705066521962484
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,512,7168,0.1017377773920695
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,512,4096,0.008288000192907121
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,512,6144,0.04851999878883362
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,512,5120,0.04095200035307143
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,512,3584,0.007734222544564142
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,512,5120,0.07850755585564508
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,512,4096,0.03496799866358439
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,512,4096,0.06501244174109565
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,512,3584,0.060602664947509766
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,512,3584,0.030889779329299927
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,512,2560,0.006567111031876669
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,512,3072,0.028301331732008193
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,512,3072,0.05409511261516147
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,512,2048,0.0059075554211934405
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,512,2560,0.048001776138941445
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,512,2560,0.025303999582926433
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,512,1536,0.005200888961553574
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,512,2048,0.04208533300293816
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,512,1024,0.004520888957712385
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,512,16384,0.1294728914896647
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,512,1536,0.01888799998495314
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,512,1536,0.03719733489884271
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,512,768,0.0038399998512532976
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,512,1024,0.01587733295228746
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,512,1024,0.03114933437771267
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,512,512,0.0038577777643998465
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,512,768,0.014526221487257214
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,512,768,0.028379556205537584
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,512,256,0.0033200000309281876
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,512,512,0.013350221845838757
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,512,512,0.026564444104830425
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,512,128,0.003156444471743372
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,512,256,0.01237155579858356
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,512,256,0.02313066687848833
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,512,5120,0.010042666561073726
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,512,64,0.0031644445326593188
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,512,32,0.003142222141226133
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,512,128,0.02074044446150462
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,512,128,0.01205244412024816
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,512,64,0.01203555530971951
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,256,65536,0.037696888049443565
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,512,3072,0.007080000307824876
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,256,51200,0.030870222383075293
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,512,2048,0.021947556071811255
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,256,65536,0.516159110599094
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,256,51200,0.4055662155151367
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,256,16384,0.014194667339324951
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,256,12288,0.011738667057620155
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,256,51200,0.6424213515387641
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,256,16384,0.13060355186462402
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,256,65536,0.8140177726745605
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,256,12288,0.0939297808541192
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,256,10240,0.012847111456924014
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,256,8192,0.013066666821638743
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,256,12288,0.16036178006066218
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,256,10240,0.07856444517771403
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,256,10240,0.13612355126274958
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,256,8192,0.06397866540484957
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,512,6144,0.08980266915427314
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,256,6144,0.010627555350462595
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,256,8192,0.11260710822211371
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,512,32,0.011761777930789523
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,256,7168,0.05605777766969469
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,256,5120,0.0094373333785269
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,256,7168,0.1019173330730862
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,256,4096,0.007983110845088959
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,256,6144,0.048115554783079356
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,256,6144,0.08876266744401719
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,256,3584,0.007634667058785756
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,256,5120,0.07802310917112562
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,256,4096,0.03468177715937296
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,256,4096,0.06486311223771837
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,256,3072,0.006590222318967183
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,256,3584,0.06102933486302694
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,256,3584,0.030814223819308813
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,256,2560,0.006280000011126201
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,256,3072,0.027822222974565294
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,256,3072,0.053759998745388456
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,256,2048,0.00555288874440723
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,256,2560,0.02518400053183238
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,256,2560,0.0481608874268002
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,256,1536,0.004867555366622077
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,256,2048,0.02199111051029629
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,256,2048,0.041801777150895864
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,256,16384,0.212865776485867
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,256,1024,0.0041831110914548235
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,256,768,0.003825777934657203
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,256,1536,0.01885955532391866
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,256,1536,0.037091556522581316
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,256,512,0.0035146665241983202
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,256,1024,0.015513777732849121
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,256,768,0.028455999162462022
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,256,256,0.003212444484233856
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,256,7168,0.011795555551846823
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,256,512,0.012855999999576144
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,256,512,0.02570399973127577
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,256,128,0.002833777831660377
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,256,256,0.024340444140964087
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,256,256,0.012065778175989786
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,256,128,0.020576000213623047
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,256,64,0.00281866660548581
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,256,128,0.011748444702890186
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,256,32,0.0028799999919202593
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,128,65536,0.030245333909988403
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,256,64,0.011751111182901593
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,256,5120,0.04052088989151849
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,256,32,0.011762667033407422
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,128,51200,0.02346755564212799
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,128,16384,0.011010666688283285
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,128,16384,0.1286835538016425
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,128,65536,0.5148968696594238
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,128,51200,0.40482576688130695
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,128,12288,0.012437333663304647
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,128,16384,0.21217689249250624
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,128,51200,0.640635543399387
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,128,12288,0.09363910886976455
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,256,1024,0.03117777903874715
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,128,10240,0.011405333048767514
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,128,65536,0.8143119812011719
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,128,12288,0.15993689166174993
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,256,768,0.014482667048772177
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,128,8192,0.01038755559258991
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,128,7168,0.009672000176376766
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,128,6144,0.008991999758614434
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,128,10240,0.07819466458426581
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,128,10240,0.13595733377668592
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,128,8192,0.06265333626005384
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,128,8192,0.1122631099489
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,128,7168,0.05589510997136434
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,128,7168,0.10117510954538982
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,128,5120,0.008350222474998897
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,128,6144,0.04795911245875888
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,128,4096,0.007608888877762689
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,128,6144,0.08881333139207627
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,128,5120,0.04004888733228048
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,128,5120,0.07573155562082927
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,128,4096,0.033518221643235944
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,128,3072,0.00658044425977601
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,128,4096,0.06393955813513862
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,128,2560,0.005889777921968036
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,128,3584,0.030809776650534734
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,128,3584,0.059267554018232554
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,128,2048,0.005551110953092575
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,128,2560,0.025049777494536504
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,128,2560,0.048151999711990356
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,128,1536,0.004589333302444882
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,128,2048,0.021964444054497614
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,128,1024,0.0041928887367248535
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,128,1536,0.037083556254704796
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,128,1024,0.015491555134455362
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,128,768,0.0038497779104444715
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,128,1024,0.03119200136926439
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,128,768,0.028453333510292902
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,128,768,0.014459555347760519
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,128,512,0.003506666670242945
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,128,512,0.01275644451379776
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,128,512,0.026173333326975506
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,128,256,0.0031999999450312722
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,128,3584,0.006968888971540663
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,128,128,0.0029093333416514923
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,128,256,0.012395555774370829
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,128,128,0.011764444410800934
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,128,128,0.020936000678274367
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,128,64,0.0028648889727062653
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,128,32,0.002924444360865487
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,128,64,0.011698666546079846
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,128,32,0.011365333365069495
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,128,2048,0.041365332073635526
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,64,51200,0.025590222742822435
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,128,1536,0.01891911029815674
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,64,16384,0.009707555174827576
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,64,16384,0.13025066587660047
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,64,12288,0.008647110727098253
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,64,51200,0.40508177545335555
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,64,65536,0.5150160259670681
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,64,10240,0.00903733323017756
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,64,8192,0.008240888516108194
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,64,12288,0.09364622169070774
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,64,7168,0.007987555530336168
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,64,10240,0.07824711004892985
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,128,256,0.023315555519527856
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,64,6144,0.007617777420414819
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,64,8192,0.0630542238553365
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,64,5120,0.007663999994595845
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,64,4096,0.007260444263617198
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,128,3072,0.02780088782310486
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,64,7168,0.05513866742451986
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,64,3584,0.006940444310506185
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,64,5120,0.039099554220835366
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,64,3072,0.006309333360857434
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,64,4096,0.03338755501641168
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,64,3584,0.030576000610987347
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,64,65536,0.03131644593344794
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,64,2048,0.005245333330498801
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,64,3072,0.02776177724202474
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,64,1536,0.004519111166397731
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,64,1024,0.003887999802827835
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,64,2560,0.02506133251720005
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,64,768,0.0035208890007601846
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,64,2048,0.021777777208222285
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,64,512,0.0031742221779293488
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,64,1536,0.01891999940077464
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,64,1024,0.01550044450494978
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,64,768,0.0144213338692983
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,64,128,0.002809777855873108
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,64,512,0.013101333545313941
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,64,64,0.002549333290921317
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,64,256,0.012044444680213928
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,64,32,0.0028595555987623003
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,64,128,0.011687111523416309
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,64,64,0.011757333245542316
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,32,65536,0.02663822140958574
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,64,32,0.011408000356621213
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,32,51200,0.020455110404226515
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,32,16384,0.01202222208182017
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,1024,128,3072,0.05323733223809136
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,32,16384,0.1299066676033868
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,64,6144,0.04590310984187656
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,32,10240,0.009690666364298927
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,64,2560,0.0057848890622456866
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,32,51200,0.4046657880147298
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,32,8192,0.00902133352226681
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,32,65536,0.5151217778523763
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,32,7168,0.008799110849698385
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,32,6144,0.008350222474998897
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,32,12288,0.09280088875028823
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,32,5120,0.007619555625650618
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,32,10240,0.07738577657275729
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,32,8192,0.06304355462392171
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,32,4096,0.007599111232492659
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,32,7168,0.05520711011356778
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,32,3584,0.0069297779765393995
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,32,6144,0.046859555774264865
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,32,3072,0.0063440000845326324
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,32,5120,0.039114667309655085
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,32,2560,0.005886222339338726
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,64,256,0.0031635556370019913
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,32,4096,0.03357244531313578
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,32,3584,0.03053955568207635
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,32,2048,0.00589155571328269
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,32,1536,0.004918222212129169
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,32,3072,0.027671999401516382
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,32,2560,0.025029333101378545
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,32,2048,0.021822222405009802
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,32,1536,0.018922666708628338
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,32,512,0.003192000091075897
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,32,1024,0.015458666616015963
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,32,256,0.0031884445084465873
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,32,128,0.0028648889727062653
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,32,768,0.014448000325096978
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,32,64,0.002534222271707323
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,32,256,0.011755555868148804
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,32,32,0.0028168888141711554
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,32,128,0.011730666789743634
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,32,64,0.01146755533085929
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,32,32,0.011366222467687396
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,32,12288,0.010391111175219217
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,32,1024,0.004197333421972063
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1024,32,768,0.003588444242874781
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1024,32,512,0.013125333521101209
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,65536,16384,1.045072873433431
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,65536,16384,1.1864293416341145
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,65536,12288,0.7263324525621203
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,65536,10240,0.5589555634392632
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,65536,12288,0.8577795558505588
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,65536,8192,0.457289801703559
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,65536,10240,0.7960089047749838
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,65536,7168,0.4496595594618056
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,65536,8192,0.6148595809936523
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,65536,6144,0.3903848859998915
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,65536,7168,0.4945155779520671
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,65536,5120,0.2874915599822998
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,65536,4096,0.2540506786770291
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,65536,6144,0.42749423450893825
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,65536,3584,0.20906399355994332
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,65536,5120,0.44249688254462344
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,65536,3072,0.19605067041185167
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,65536,2560,0.15356889035966662
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,65536,3072,0.21705688370598686
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,65536,3584,0.2572400040096707
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,65536,51200,3.1525671217176647
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,65536,1536,0.10075466500388251
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,65536,2560,0.19035644001430937
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,65536,1024,0.07667111025916205
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,65536,768,0.05413600140147739
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,65536,2048,0.15591911474863687
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,65536,1536,0.1225022210015191
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,65536,512,0.04058666692839728
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,65536,256,0.03232977787653605
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,65536,1024,0.09432355562845866
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,65536,128,0.02624888883696662
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,65536,512,0.06865866978963216
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,65536,256,0.062422222561306424
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,65536,128,0.05838844511244032
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,65536,32,0.023018666439586218
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,65536,768,0.08308800061543782
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,65536,64,0.058561775419447154
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,65536,32,0.05766666597790188
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,65536,51200,4.057139502631293
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,65536,4096,0.30285244517856175
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,65536,2048,0.1222684383392334
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,65536,64,0.022308443983395893
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,51200,16384,0.7770506540934244
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,51200,12288,0.5670808686150445
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,51200,16384,0.9368907080756294
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,51200,10240,0.5054142210218642
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,51200,12288,0.6845813327365451
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,51200,8192,0.3693671226501465
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,51200,10240,0.6038239796956381
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,51200,7168,0.33982666333516437
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,51200,6144,0.2867475615607368
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,51200,8192,0.5232533348931206
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,51200,7168,0.4178026782141791
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,51200,5120,0.22652800877888998
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,51200,51200,2.6072639889187283
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,51200,4096,0.18385777208540174
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,51200,6144,0.3809066613515218
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,51200,5120,0.2939564387003581
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,51200,3584,0.17992356088426378
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,51200,3072,0.1409440040588379
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,51200,4096,0.27362312210930717
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,51200,2560,0.12591555383470324
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,51200,3584,0.20503200425042045
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,51200,3072,0.17602133750915527
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,51200,2048,0.10611733463075425
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,51200,65536,3.3578052520751953
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,51200,1536,0.07763289080725776
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,51200,1024,0.05759466356701321
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,51200,2560,0.1561608844333225
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,51200,768,0.042985777060190834
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,51200,1536,0.0999164448844062
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,51200,51200,3.209443622165256
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,51200,512,0.03375377919938829
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,51200,1024,0.08852710988786484
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,51200,256,0.026503110925356548
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,51200,128,0.02436711059676276
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,51200,64,0.020679111282030743
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,51200,512,0.05648089117474026
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,51200,256,0.05278133352597555
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,51200,2048,0.13180088996887207
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,51200,128,0.048192888498306274
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,51200,32,0.023012444376945496
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,51200,64,0.04931733343336317
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,51200,32,0.048511111074023776
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,51200,65536,4.07228257921007
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,16384,16384,0.27918932172987193
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,16384,12288,0.2063973347345988
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,16384,51200,0.7506702211168078
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,16384,65536,1.0245591269599068
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,16384,10240,0.17839554945627847
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,51200,768,0.06628888845443726
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,16384,12288,0.2911013232337104
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,16384,51200,1.1523653666178386
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,16384,7168,0.12861066394382054
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,16384,8192,0.147070222430759
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,16384,8192,0.17419732941521537
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,16384,10240,0.22823378774854872
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,16384,6144,0.10581333107418484
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,16384,65536,1.4672613143920898
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,16384,5120,0.08380444182289971
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,16384,4096,0.07059022453096178
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,16384,7168,0.1543955538007948
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,16384,3584,0.06010044283337063
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,16384,6144,0.15386845005883112
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,16384,3072,0.05288266804483202
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,16384,5120,0.11960355440775554
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,16384,4096,0.09497333235210842
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,16384,2560,0.0543066660563151
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,16384,2048,0.04495733314090305
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,16384,3584,0.08779466814464992
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,16384,1536,0.03489066825972663
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,16384,1024,0.025058666865030926
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,16384,768,0.019665777683258057
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,16384,1024,0.03532177872127957
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,16384,16384,0.34294488694932723
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,16384,1536,0.04382933179537455
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,16384,512,0.01521511044767168
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,16384,768,0.02977777851952447
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,16384,256,0.01110311100880305
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,16384,2048,0.054720001088248364
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,16384,512,0.025425778494940862
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,16384,2560,0.06488177511427137
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,16384,256,0.023008000519540574
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,16384,64,0.008962666822804345
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,16384,128,0.022403554783927068
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,16384,64,0.02232088810867733
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,16384,32,0.021956443786621094
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,16384,3072,0.07400088840060763
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,12288,51200,0.5799671279059516
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,12288,65536,0.7529902458190918
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,12288,16384,0.18408800495995414
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,12288,12288,0.16933688852522108
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,16384,128,0.01036711119943195
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,12288,51200,0.926346672905816
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,12288,16384,0.303422212600708
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,16384,32,0.00903733323017756
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,12288,65536,1.192488882276747
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,12288,12288,0.208116438653734
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,12288,8192,0.097634666495853
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,12288,7168,0.08800533082750107
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,12288,6144,0.07453866799672444
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,12288,10240,0.17535111639234754
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,12288,8192,0.1474835607740614
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,12288,7168,0.1259982188542684
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,12288,4096,0.05487289031346639
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,12288,6144,0.10993422402275933
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,12288,3584,0.04897866646448771
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,12288,3072,0.04047377904256185
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,12288,2560,0.034246222840415105
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,12288,4096,0.0814631117714776
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,12288,3584,0.07107110818227132
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,12288,2048,0.02915466825167338
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,12288,3072,0.060601777500576444
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,12288,1536,0.02348711093266805
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,12288,1024,0.01753866672515869
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,12288,2560,0.05351110961702135
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,12288,768,0.015027556154463025
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,12288,2048,0.04491555690765381
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,12288,512,0.011810666984981961
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,12288,256,0.008904000123341879
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,12288,1024,0.029639999071757
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,12288,1536,0.03727022144529555
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,12288,768,0.0258577780591117
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,12288,128,0.007613333563009898
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,12288,512,0.022269333402315777
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,12288,64,0.007585778004593319
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,12288,256,0.020261334048377145
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,12288,128,0.019887111253208585
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,12288,64,0.01957066688272688
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,12288,10240,0.12421866257985432
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,12288,32,0.01921688848071628
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,12288,5120,0.06156444549560547
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,10240,51200,0.5052364667256674
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,10240,16384,0.15677332878112793
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,10240,65536,0.6117022302415636
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,10240,12288,0.12308355172475179
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,10240,10240,0.09448711077372234
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,10240,51200,0.8223182360331217
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,10240,16384,0.2607395648956299
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,10240,12288,0.2056746615303887
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,10240,65536,1.0530462265014648
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,10240,7168,0.07720266448126899
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,10240,10240,0.1567795541551378
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,10240,6144,0.06049066781997681
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,10240,8192,0.1292639970779419
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,10240,5120,0.05054488778114319
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,10240,7168,0.11286489168802898
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,10240,4096,0.04228711128234863
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,10240,6144,0.09956622123718262
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,10240,5120,0.0859759979777866
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,10240,3584,0.039275556802749634
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,10240,3072,0.034663110971450806
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,10240,4096,0.07133511039945814
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,10240,2560,0.03061422374513414
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,10240,3584,0.06469688812891643
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,10240,2048,0.024360888534122046
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,10240,3072,0.05604444609747993
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,10240,1536,0.019778667224778067
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,12288,5120,0.0948080023129781
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,10240,2560,0.047854221529430814
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,10240,768,0.012127111355463663
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,10240,1536,0.033612443341149226
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,10240,512,0.010032888915803697
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,10240,1024,0.027012444204754297
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,10240,256,0.007190222541491191
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,10240,768,0.02330222229162852
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,10240,128,0.006582222051090664
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,10240,512,0.020280000236299302
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,10240,64,0.005893333504597346
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,10240,256,0.01889155473974016
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,10240,32,0.005959110955397288
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,10240,128,0.018583110637134977
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,10240,8192,0.08963911400900947
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,10240,64,0.018219555417696636
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,12288,32,0.007660444411966536
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,10240,32,0.017982222967677645
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,8192,16384,0.1307093302408854
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,8192,65536,0.4697679943508572
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,8192,51200,0.4046666622161865
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,8192,16384,0.21569155322180855
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,8192,12288,0.1045431097348531
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,10240,1024,0.014863111906581454
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,8192,10240,0.08323733011881511
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,10240,2048,0.04123555620511373
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,8192,12288,0.18569510512881807
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,8192,51200,0.7120141983032227
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,8192,7168,0.05729689200719198
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,8192,10240,0.1432622273763021
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,8192,6144,0.054273777537875705
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,8192,65536,0.9053244060940213
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,8192,5120,0.04530488782458835
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,8192,8192,0.11304799715677898
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,8192,4096,0.03673333260748122
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,8192,7168,0.10385777552922566
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,8192,3584,0.03239377670817905
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,8192,6144,0.08830666542053223
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,8192,3072,0.03040800160831875
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,8192,5120,0.07525600327385797
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,8192,2560,0.02568000058333079
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,8192,4096,0.06470044453938802
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,8192,2048,0.02198133369286855
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,8192,3584,0.05627999703089396
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,8192,1536,0.018441778090265062
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,8192,3072,0.048700445228152804
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,8192,1024,0.014411555396185981
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,8192,2560,0.04422044422891405
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,8192,768,0.0118568887313207
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,8192,2048,0.03724711139996847
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,8192,512,0.009313777916961247
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,8192,256,0.006426666759782367
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,8192,1536,0.030301332473754883
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,8192,128,0.006401777681377199
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,8192,768,0.021722666091389124
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,8192,64,0.005884444548024072
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,8192,512,0.018889778190188937
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,8192,32,0.006226666685607698
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,8192,256,0.018178666631380718
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,8192,128,0.01715377800994449
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,8192,64,0.017158221867349412
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,8192,32,0.016511999898486666
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,7168,16384,0.11099466350343491
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,7168,65536,0.4024657673305935
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,8192,8192,0.06937155458662245
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,7168,12288,0.08124533626768324
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,7168,10240,0.07874844471613567
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,7168,8192,0.0657786660724216
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,7168,12288,0.15018844604492188
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,7168,7168,0.05524177683724297
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,7168,10240,0.13446488645341662
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,7168,51200,0.6538169119093153
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,7168,65536,0.8306124475267199
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,7168,6144,0.04162844353251987
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,7168,8192,0.10417866706848145
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,7168,5120,0.035974221097098455
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,7168,4096,0.030392888519499037
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,7168,7168,0.09297866953743829
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,7168,6144,0.0817013316684299
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,8192,1024,0.0243857784403695
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,7168,3584,0.028075555960337322
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,7168,3072,0.0247662216424942
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,7168,5120,0.06874489121966891
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,7168,2560,0.02108088963561588
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,7168,4096,0.05740266376071506
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,7168,3584,0.0506897767384847
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,7168,2048,0.01793955597612593
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,7168,1536,0.015233778291278414
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,7168,3072,0.04483555422888862
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,7168,1024,0.011424000064531961
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,7168,2560,0.039868444204330444
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,7168,768,0.00909511082702213
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,7168,512,0.007292444507280986
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,7168,1536,0.028347555134031508
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,7168,1024,0.022666666242811415
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,7168,768,0.020303999384244282
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,7168,128,0.0052577778697013855
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,7168,512,0.018255111243989732
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,7168,51200,0.3621848954094781
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,7168,64,0.004906666775544484
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,7168,256,0.01688799924320645
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,7168,32,0.005230222311284807
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,7168,128,0.016473778420024447
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,7168,64,0.016137777103318107
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,7168,32,0.015986666083335876
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,6144,65536,0.3842497666676839
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,6144,51200,0.3193262153201633
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,6144,16384,0.10709066523445977
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,6144,12288,0.08228800031873915
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,6144,16384,0.18526132901509604
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,6144,51200,0.5968337588840061
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,6144,10240,0.06345333655675252
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,6144,65536,0.7594213485717773
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,6144,8192,0.052367998494042285
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,6144,12288,0.15072888798183864
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,7168,256,0.006156444549560547
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,6144,7168,0.04665333363744947
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,6144,6144,0.04074577821625604
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,6144,10240,0.11812355783250596
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,6144,8192,0.09747288624445598
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,6144,5120,0.035507556464936994
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,6144,4096,0.02699377801683214
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,6144,7168,0.08993777963850234
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,6144,6144,0.07842489083607991
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,6144,3584,0.024309333827760484
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,7168,16384,0.19891466034783256
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,6144,3072,0.021800888909233943
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,6144,5120,0.06400533517201741
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,6144,4096,0.0535768899652693
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,6144,2560,0.01864888932969835
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,6144,2048,0.01568000018596649
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,6144,1536,0.013348444468445249
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,6144,3072,0.04235555397139656
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,6144,1024,0.010677333507272931
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,6144,768,0.009328888522254096
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,6144,2048,0.03286400106218126
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,6144,1536,0.026536888546413843
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,6144,512,0.007582222421964009
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,6144,256,0.005934222290913264
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,6144,1024,0.021320889393488567
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,6144,768,0.01944533321592543
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,6144,128,0.005208000126812193
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,6144,64,0.005201777650250329
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,6144,512,0.017264889346228707
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,6144,256,0.016354666815863717
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,6144,32,0.005215999980767568
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,6144,128,0.01583377851380242
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,6144,64,0.015487111277050443
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,6144,32,0.015466666883892484
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,7168,2048,0.034985777404573225
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,5120,65536,0.31415732701619464
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,5120,51200,0.28294311629401314
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,5120,16384,0.08601422442330255
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,5120,12288,0.07222044467926025
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,5120,10240,0.06262133518854777
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,5120,16384,0.1704124477174547
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,5120,12288,0.12895911269717747
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,5120,8192,0.04405688908365038
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,5120,51200,0.55458312564426
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,5120,65536,0.70797332127889
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,5120,7168,0.03670488794644674
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,5120,10240,0.13043288389841715
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,6144,2560,0.03866844375928243
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,5120,6144,0.0351822210682763
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,5120,8192,0.09094311131371392
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,5120,5120,0.03186666634347703
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,5120,4096,0.02415200074513753
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,5120,3584,0.023222222924232483
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,5120,7168,0.08101955387327406
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,5120,6144,0.07152444124221802
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,5120,5120,0.05846044752332899
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,5120,4096,0.04899200134807163
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,5120,3584,0.04495199852519565
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,5120,2048,0.014930667148696052
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,5120,3072,0.03970400161213345
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,5120,1536,0.01276622215906779
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,5120,2560,0.0354364448123508
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,5120,1024,0.009115555220180089
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,5120,768,0.007947555846638149
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,5120,1536,0.024863110648261175
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,5120,512,0.006436444405052397
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,5120,1024,0.020240000552601285
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,5120,256,0.005561777700980504
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,5120,768,0.018304889400800068
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,5120,128,0.004572444491916233
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,5120,512,0.016844444804721408
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,5120,64,0.004221333397759331
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,5120,256,0.015606222881211175
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,5120,32,0.004576888763242298
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,5120,128,0.015126221709781222
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,5120,64,0.01510933372709486
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,5120,32,0.01479200025399526
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,6144,3584,0.04961155520545112
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,4096,65536,0.28498133023579914
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,4096,51200,0.22300532129075792
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,4096,16384,0.0738568902015686
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,5120,2560,0.01739377776781718
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,4096,12288,0.0580693350897895
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,4096,10240,0.04901777704556783
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,4096,16384,0.15164177947574192
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,4096,51200,0.49400175942315
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,4096,12288,0.11579644680023193
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,5120,2048,0.030699554416868422
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,4096,8192,0.038146668010287814
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,4096,7168,0.032991111278533936
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,4096,6144,0.02932000160217285
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,4096,10240,0.10123644272486369
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,4096,5120,0.024749333659807842
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,4096,8192,0.08168711264928182
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,4096,4096,0.020941333638297185
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,4096,7168,0.0726791090435452
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,4096,3584,0.01890222231547038
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,4096,5120,0.053695112466812134
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,4096,3072,0.016911110944218107
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,4096,6144,0.06283999813927545
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,4096,2560,0.014769777655601501
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,4096,4096,0.04438933398988512
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,4096,2048,0.01276533305644989
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,4096,1536,0.010956444674068026
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,4096,3072,0.03628177775277032
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,4096,2560,0.03208177619510227
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,4096,1024,0.00833511104186376
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,4096,2048,0.028391109572516546
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,4096,768,0.007259555160999298
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,4096,1536,0.022683555881182354
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,4096,512,0.006568000134494569
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,4096,256,0.005261333452330695
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,4096,1024,0.01900888813866509
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,4096,768,0.017522666189405654
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,4096,128,0.004862222406599256
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,4096,64,0.0042275554604000514
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,5120,3072,0.020968000094095867
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,4096,256,0.01511111193233066
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,4096,32,0.004247111164861255
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,4096,128,0.014833778142929077
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,4096,64,0.014177777700954013
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,4096,32,0.014145778285132514
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,4096,65536,0.6374737951490614
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,3584,51200,0.17822844452328154
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,3584,16384,0.06080177757475111
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,3584,12288,0.04244977898067898
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,3584,16384,0.14265688260396323
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,3584,65536,0.5980986489189996
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,3584,51200,0.46804353925916886
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,3584,12288,0.10818044344584148
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,3584,8192,0.03184266553984748
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,3584,7168,0.027631110615200464
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,3584,10240,0.09256355630026923
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,3584,8192,0.07658666372299194
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,3584,6144,0.025872000389628943
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,3584,7168,0.06799911128150092
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,3584,5120,0.021905778182877436
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,4096,512,0.015787555111779105
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,3584,4096,0.017861333158281114
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,3584,3584,0.016040888097551134
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,3584,6144,0.05916711356904772
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,3584,3072,0.014703111516104804
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,3584,5120,0.049752000305387706
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,3584,4096,0.04157511062092251
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,3584,2560,0.012879999975363413
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,3584,2048,0.011399110986126794
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,3584,3072,0.03408177693684896
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,3584,65536,0.2482337686750624
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,3584,2048,0.026562665899594624
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,3584,1024,0.007263110743628607
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,3584,1536,0.021518222159809534
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,3584,768,0.006258666515350342
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,3584,1024,0.018183999591403537
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,3584,512,0.0052986666560173035
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,3584,10240,0.038591110044055514
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,4096,3584,0.04089511103100247
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,3584,768,0.016574222180578444
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,3584,256,0.00453333349691497
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,3584,128,0.0038977778620190094
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,3584,512,0.015136889285511441
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,3584,64,0.0038497779104444715
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,3584,256,0.014825777875052558
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,3584,128,0.014093332820468478
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,3584,64,0.013777777552604675
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,3584,32,0.013784888717863293
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,3072,65536,0.24663199318779838
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,3584,3584,0.038527111212412514
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,3072,16384,0.0646159980032179
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,3584,1536,0.00926755534278022
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,3072,12288,0.049359109666612416
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,3072,65536,0.5760782029893663
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,3072,10240,0.04160711169242859
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,3072,16384,0.13985599411858454
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,3072,51200,0.46066845787896055
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,3072,8192,0.033547557062572904
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,3072,12288,0.10646044545703465
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,3072,7168,0.0296382208665212
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,3072,6144,0.0251866661840015
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,3072,10240,0.09126933415730794
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,3072,8192,0.07715466949674818
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,3072,5120,0.021517333057191636
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,3072,7168,0.06653510861926608
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,3072,4096,0.018351111147138808
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,3072,3584,0.01651822196112739
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,3072,6144,0.057526224189334445
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,3584,32,0.0038355555799272326
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,3072,5120,0.04845066534148323
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,3072,3072,0.014843554960356818
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,3072,2560,0.012999110751681857
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,3072,4096,0.04117688867780898
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,3072,2048,0.011061333119869232
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,3072,3584,0.03780000077353583
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,3072,3072,0.03374400072627597
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,3072,2560,0.02974489000108507
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,3072,2048,0.026038222842746313
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,3072,768,0.0062773335311147906
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,3072,1536,0.021271111236678228
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,3072,51200,0.19177867306603325
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,3072,1024,0.017934223016103108
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,3072,512,0.005892444401979446
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,3072,256,0.004888888862397936
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,3072,768,0.016528000434239704
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,3072,128,0.004551110996140374
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,3072,64,0.004081777814361784
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,3072,512,0.015132443772421943
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,3072,256,0.014104000396198697
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,3072,32,0.0041866666740841335
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,3072,128,0.013798221945762634
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,3072,64,0.013797333670987023
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,3072,32,0.013399110900031196
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,2560,65536,0.18739467196994355
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,2560,51200,0.13877511024475098
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,2560,16384,0.0495760010348426
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,2560,12288,0.03718311256832547
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,2560,16384,0.12976355022854275
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,2560,10240,0.029667556285858154
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,2560,51200,0.42166932423909503
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,2560,8192,0.02520977788501316
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,3072,1536,0.009014222357008193
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,2560,7168,0.02203111184967889
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,3072,1024,0.00692622239391009
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,2560,10240,0.08464977476331924
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,2560,6144,0.01924977699915568
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,2560,8192,0.06901688708199395
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,2560,5120,0.01682933337158627
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,2560,4096,0.014760888285107084
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,2560,7168,0.06141422192255656
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,2560,6144,0.053415109713872276
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,2560,3584,0.013472889032628802
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,3584,2560,0.03047555685043335
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,2560,3072,0.012270222107569376
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,2560,5120,0.04518489042917887
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,2560,2560,0.01074488874938753
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,2560,4096,0.03861600160598755
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,2560,2048,0.009493333597977957
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,2560,1536,0.007659555309348636
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,2560,3584,0.035465776920318604
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,2560,1024,0.00628266649113761
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,2560,2560,0.027296889159414504
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,2560,2048,0.02405511173937056
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,2560,768,0.00556355549229516
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,2560,1536,0.020283554991086323
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,2560,512,0.004922666483455234
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,2560,1024,0.017200888858901132
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,2560,768,0.016172443826993305
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,2560,512,0.014759999182489185
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,2560,256,0.013904000322024027
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,2560,64,0.0035342222286595237
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,2560,128,0.013420444395807056
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,2560,12288,0.09919822216033936
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,2560,32,0.003548444559176763
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,2560,65536,0.536669307284885
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,2560,64,0.013451555536852943
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,2560,32,0.012905778156386482
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,2048,65536,0.17922133869595
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,2048,51200,0.13580532868703207
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,2048,16384,0.04637155599064297
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,2048,12288,0.034090667963027954
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,2048,16384,0.11992711491054958
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,2048,12288,0.09178311294979519
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,2048,10240,0.028943998946083918
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,2048,65536,0.49875466028849286
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,2048,51200,0.38940800560845273
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,2048,8192,0.024125332633654278
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,2560,3072,0.0310444434483846
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,2048,7168,0.021942221456103857
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,2048,6144,0.01924711134698656
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,2048,10240,0.07817866404851277
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,2048,5120,0.016759110821617972
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,2048,7168,0.056531555122799344
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,2560,256,0.004176889028814104
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,2048,4096,0.01423822177780999
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,2048,6144,0.049117333359188504
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,2048,3584,0.01311911145846049
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,2048,3072,0.011721777419249216
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,2048,5120,0.04207288887765673
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,2560,128,0.003624000069167879
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,2048,2560,0.01038577738735411
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,2048,4096,0.035692443450291954
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,2048,1536,0.007603555917739868
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,2048,2560,0.02536444365978241
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,2048,2048,0.02251111136542426
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,2048,1024,0.006230222268237009
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,2048,768,0.005544888890451855
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,2048,1536,0.018952889574898612
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,2048,512,0.004895110925038655
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,2048,1024,0.016701334052615695
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,2048,256,0.0038702223036024305
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,2048,768,0.01516888870133294
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,2048,128,0.0035742223262786865
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,2048,512,0.014095111025704278
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,2048,64,0.0035084444615576
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,2048,256,0.01348977784315745
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,2048,32,0.0035333335399627686
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,2048,128,0.01311288856797748
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,2048,64,0.012732444538010491
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,2048,32,0.01290933373901579
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,1536,51200,0.10173333353466457
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,2048,8192,0.06390844451056586
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,1536,16384,0.03369066781467862
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,2048,2048,0.0092622223827574
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,1536,65536,0.4868684344821506
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,1536,12288,0.02553244431813558
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,2048,3072,0.02885066800647312
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,1536,16384,0.1188817818959554
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,1536,10240,0.021599110629823472
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,1536,51200,0.3827066686418321
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,1536,8192,0.020419556233617995
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,1536,7168,0.01867288847764333
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,1536,6144,0.0166302224000295
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,1536,10240,0.07681244611740112
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,1536,8192,0.0626151098145379
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,1536,5120,0.014765333798196582
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,1536,7168,0.05511733227305942
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,1536,4096,0.012695999609099494
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,1536,3584,0.011350221931934357
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,1536,6144,0.048263112703959145
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,1536,5120,0.041305777099397444
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,1536,3072,0.010016000105275048
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,1536,4096,0.03466755482885573
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,1536,2560,0.009283555878533257
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,1536,2048,0.007627555893527136
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,1536,3584,0.03196000059445699
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,1536,1536,0.006728888799746831
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,1536,3072,0.02809422214825948
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,1536,1024,0.005566222386227713
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,1536,2560,0.025084444218211707
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,1536,2048,0.022776888476477727
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,1536,768,0.005203555441564984
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,1536,512,0.004335111214054955
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,1536,1536,0.018896889355447557
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,1536,256,0.003863999827040566
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,1536,1024,0.016190222567982145
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,1536,128,0.0033031110134389666
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,1536,768,0.015135111080275642
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,1536,512,0.013968000809351603
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,1536,256,0.013088888592190213
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,1536,32,0.0033119999700122406
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,1536,128,0.013017777767446307
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,1536,64,0.012730666332774691
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,2048,3584,0.0325288905037774
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,1536,32,0.01239733315176434
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,1024,65536,0.09467555416954888
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,1024,51200,0.07547110981411405
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,1024,16384,0.029391109943389893
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,1024,12288,0.026347556047969397
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,1024,10240,0.02274311085542043
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,1536,12288,0.09127822187211777
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,1024,16384,0.10876711209615071
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,1024,8192,0.01925244430700938
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,1024,12288,0.08261866701973809
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,1024,7168,0.017210667332013447
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,1024,51200,0.34879644711812335
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,1024,65536,0.44416001107957626
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,1024,10240,0.07050844695832995
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,1024,6144,0.01443733274936676
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,1024,5120,0.012079111403889127
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,1024,8192,0.0565297802289327
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,1024,4096,0.011391110718250275
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,1024,3584,0.009663999908500248
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,1024,7168,0.05068177647060818
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,1024,6144,0.0438435541258918
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,1024,3072,0.009138666921191746
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,1024,5120,0.03750755720668369
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,1024,2560,0.008292444050312042
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,1024,2048,0.007304000357786815
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,1024,3584,0.029462221595976088
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,1024,1536,0.00598933340774642
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,1024,3072,0.025800888737042744
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,1024,2560,0.023346667488416035
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,1024,1024,0.00553688903649648
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,1024,2048,0.020626667473051283
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,1024,768,0.00453599997692638
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,1024,512,0.004187555362780889
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,1536,64,0.00315022220214208
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,1024,1536,0.017889777819315594
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,1024,1024,0.015499555402331881
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,1024,256,0.0035031110876136353
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,1024,128,0.003519999898142285
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,1024,64,0.003181333343187968
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,1024,512,0.013448889056841532
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,1024,256,0.012776888906955719
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,1024,128,0.012453333371215396
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,1024,64,0.012410666379663678
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,768,65536,0.06615999672147962
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,1024,32,0.012074666718641916
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,768,51200,0.05275200141800774
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,768,16384,0.023294222023752
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,768,16384,0.10739377472135757
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,768,51200,0.34676800833808047
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,768,65536,0.44036089049445254
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,768,12288,0.01962577799956004
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,1024,4096,0.03171644608179728
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,768,10240,0.018054222067197163
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,768,8192,0.015169777803950839
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,1536,65536,0.13252088758680555
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,768,7168,0.013454222016864352
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,768,12288,0.08146578073501587
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,768,10240,0.06905777586830987
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,768,6144,0.012084444363911947
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,768,8192,0.055697778860727944
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,768,4096,0.009296889106432596
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,768,7168,0.04862133330769009
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,768,6144,0.042698668109046094
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,768,3584,0.007989333735571967
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,768,5120,0.036686221758524575
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,768,3072,0.007313778003056844
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,1024,768,0.01424533294306861
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,768,2560,0.006606222026877933
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,768,4096,0.03149244520399306
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,768,2048,0.006191111273235745
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,1024,32,0.0032008888406885993
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,768,1536,0.0052328887912962176
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,768,3584,0.028991109795040552
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,768,3072,0.025751110580232408
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,768,1024,0.004550222307443619
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,768,768,0.0041991112132867174
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,768,2560,0.02331111166212294
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,768,2048,0.020783111453056335
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,768,1536,0.01752622259987725
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,768,1024,0.015138667490747241
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,768,512,0.01311466677321328
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,768,128,0.0031679999083280563
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,768,64,0.0028764444092909494
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,768,256,0.012511110968059964
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,768,32,0.003156444471743372
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,768,128,0.012064889073371887
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,768,64,0.012033777932325998
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,512,65536,0.046839111381106906
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,768,32,0.011865778101815118
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,512,51200,0.03836799992455377
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,512,16384,0.01800622211562263
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,512,16384,0.09746133618884617
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,512,51200,0.3167840109931098
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,512,10240,0.015555555621782938
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,512,12288,0.07345244619581434
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,512,8192,0.015837333268589444
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,768,512,0.003568888952334722
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,768,256,0.0034773333205117118
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,512,10240,0.06252621942096286
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,512,7168,0.012888000243239932
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,768,768,0.014096889230940076
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,512,6144,0.01069155583779017
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,512,8192,0.05026577909787496
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,512,5120,0.009527111219035255
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,512,4096,0.008279110822412703
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,512,3584,0.0075911109646161394
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,512,6144,0.03929422299067179
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,512,5120,0.03334133492575751
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,512,3072,0.0069413334131240845
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,512,4096,0.028515554136700098
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,512,2560,0.006587555425034628
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,512,2048,0.00555644432703654
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,512,3584,0.026594666971100703
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,512,1536,0.005106666849719154
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,512,3072,0.02367111047108968
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,512,2560,0.021664000219768945
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,512,1024,0.004197333421972063
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,512,2048,0.019335110982259113
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,512,768,0.004206222378545337
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,512,1536,0.016662221815851
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,512,512,0.003556444413132138
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,512,1024,0.014562666416168213
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,768,5120,0.01071200023094813
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,512,256,0.0032071111102898917
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,512,768,0.013764444324705334
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,512,128,0.0031742221779293488
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,512,12288,0.017056889004177518
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,512,64,0.0031635556370019913
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,512,512,0.01278222186697854
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,512,32,0.0031724443866146933
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,512,256,0.012542222109105853
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,256,65536,0.03088444471359253
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,512,64,0.011743110915025076
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,256,51200,0.028809779220157202
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,256,16384,0.012607110871209038
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,256,16384,0.09644799762301975
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,256,51200,0.31551822026570636
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,256,65536,0.4003102249569363
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,512,7168,0.04518666532304552
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,256,10240,0.011422221859296164
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,256,8192,0.010025777750545079
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,256,12288,0.07328710953394572
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,256,10240,0.06177155839072334
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,256,7168,0.010002666877375709
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,256,8192,0.04910577668084038
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,256,6144,0.00998933364947637
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,256,5120,0.00945955514907837
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,256,7168,0.04393511017163595
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,256,4096,0.007967111137178209
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,256,6144,0.03887288769086202
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,256,3584,0.006999111009968652
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,256,5120,0.03308355477121141
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,512,65536,0.40232356389363605
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,256,3072,0.006616888774765863
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,256,2560,0.006091555373536215
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,256,4096,0.02849777870708042
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,512,128,0.012115555504957834
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,256,3584,0.026538666751649644
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,256,2048,0.0052328887912962176
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,256,3072,0.023767110374238756
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,256,1536,0.004572444491916233
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,256,1024,0.0038951109680864546
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,256,2560,0.02159022291501363
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,256,768,0.0038319999972979226
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,256,512,0.003536888708670934
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,256,1536,0.01681600014368693
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,256,1024,0.014448000325096978
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,256,256,0.0031795555518733132
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,256,128,0.003185777821474605
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,256,768,0.013430222041077085
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,256,64,0.0028204443968004654
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,256,512,0.012748444245921241
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,256,12288,0.012067555553383298
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,256,32,0.0029440000653266907
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,256,256,0.012062222593360476
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,256,128,0.012016889121797351
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,128,65536,0.025050666597154405
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,256,64,0.011705777711338468
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,128,51200,0.018567999203999836
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,128,16384,0.010320000350475311
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,256,32,0.011748444702890186
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,128,12288,0.008956444760163626
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,128,10240,0.011707555916574268
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,128,16384,0.09606222311655681
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,128,12288,0.07241066959169176
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,128,8192,0.01037333326207267
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,128,51200,0.3154088921017117
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,128,10240,0.061589333746168345
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,128,6144,0.009006222089131674
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,128,8192,0.0490551127327813
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,128,7168,0.04305600126584371
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,128,5120,0.008280889027648503
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,128,6144,0.03854488995340135
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,128,4096,0.0075902218619982404
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,128,3584,0.007245333658324347
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,512,32,0.011874666644467248
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,128,5120,0.032920890384250216
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,128,3072,0.006249777972698212
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,128,2560,0.005899555567238066
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,128,4096,0.028129776318868
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,256,2048,0.01923733287387424
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,128,3584,0.026518222358491685
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,128,3072,0.023491554790072974
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,128,1536,0.004536889079544279
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,128,2560,0.021271111236678228
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,128,1024,0.0038542221817705366
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,128,768,0.003571555432346132
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,128,2048,0.019201777047581144
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,128,512,0.00350577798154619
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,128,1536,0.016711999972661335
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,128,256,0.003170666595300039
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,128,1024,0.014781332678265043
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,128,128,0.0028444443725877335
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,128,768,0.013447999954223633
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,128,64,0.0025457777082920074
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,128,32,0.002549333290921317
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,128,256,0.012115555504957834
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,128,128,0.01200977795653873
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,128,64,0.011387555963463254
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,64,65536,0.023694222172101338
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,128,32,0.011364444262451597
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,64,51200,0.016200888488027785
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,64,16384,0.011425777441925473
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,128,65536,0.40026044845581055
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,64,12288,0.008897778060701158
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,64,16384,0.09605333540174697
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,64,10240,0.008003555238246918
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,64,51200,0.3146808942159017
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,64,65536,0.39954755041334367
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,64,8192,0.008350222474998897
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,64,12288,0.07255822420120239
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,64,7168,0.00795999997191959
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,64,6144,0.007655111451943715
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,64,10240,0.06152355670928955
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,64,8192,0.04845866560935974
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,64,5120,0.008683555656009251
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,64,7168,0.042262223031785756
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,128,2048,0.00527555536892679
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,64,4096,0.007649777664078607
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,64,3584,0.006903111106819577
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,64,6144,0.037444445821974016
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,64,3072,0.006246222390068903
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,64,5120,0.03242222136921353
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,64,2560,0.005888888819350137
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,64,2048,0.005203555441564984
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,64,4096,0.028139554791980322
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,64,3584,0.02645066711637709
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,64,1536,0.004522666749027041
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,64,3072,0.02351733379893833
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,64,1024,0.0038408889538711975
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,64,2560,0.021291555629836187
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,128,512,0.012727110750145383
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,64,2048,0.0192248887485928
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,64,512,0.003162666741344664
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,64,1536,0.016757332616382174
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,64,256,0.002833777831660377
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,64,128,0.0028275555620590844
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,64,1024,0.014469333820872836
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,64,768,0.01310755560795466
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,64,64,0.002838222309947014
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,64,32,0.002552888873550627
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,64,256,0.012117333710193634
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,64,128,0.011418666276666852
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,64,64,0.011378666592968835
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,64,32,0.011083555718262991
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,32,51200,0.01550222271018558
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,32,16384,0.01720711092154185
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,32,16384,0.09498933288786147
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,32,65536,0.3995190991295709
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,32,12288,0.013732444081041547
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,32,51200,0.31461599138047963
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,32,10240,0.009358222285906473
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,32,8192,0.008678221868144141
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,32,12288,0.07239377498626709
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,32,10240,0.06094488832685682
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,32,8192,0.04821244544453091
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,32,7168,0.01937599976857503
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,32,6144,0.00795733349190818
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,32,5120,0.012715555727481842
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,64,768,0.0035093331502543557
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,32,4096,0.007989333735571967
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,32,6144,0.03780711028310988
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,32,3584,0.007676444119877285
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,32,5120,0.03229599859979417
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,64,512,0.012720888687504662
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,32,3072,0.0069653333889113525
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,32,4096,0.028156446086035833
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,32,2560,0.006291555447710886
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,32,65536,0.01942933268017239
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,32,3584,0.026341333985328674
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,32,2048,0.005593777944644292
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,128,7168,0.009687110781669617
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,32,1536,0.004688888788223267
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,32,1024,0.003863999827040566
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,32,3072,0.02360444433159298
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,32,2560,0.021262221866183813
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,32,768,0.003535110917356279
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,32,512,0.003145777723855443
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,32,2048,0.01924444403913286
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,32,256,0.0028613333900769553
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,32,1024,0.014371555712487964
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,32,128,0.0028115556471877625
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,32,768,0.013430222041077085
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,32,64,0.002577777744995223
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,32,512,0.012803555362754397
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,769,32,32,0.002748444469438659
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,32,256,0.012114666402339935
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,32,128,0.011402666568756104
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,32,64,0.011347555451922946
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,32,32,0.011569778124491373
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,32,7168,0.043235556946860425
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,65536,16384,0.9263377719455295
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,769,32,1536,0.01627288924323188
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,65536,16384,1.0902328491210938
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,65536,12288,0.7080177730984158
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,65536,12288,0.7987982432047526
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,65536,10240,0.5617173512776693
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,65536,10240,0.6830515331692166
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,65536,51200,2.957160101996528
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,65536,8192,0.46237866083780926
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,65536,16384,0.9622799555460612
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,65536,12288,0.731660419040256
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,65536,8192,0.5512151188320583
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,65536,10240,0.5913262367248535
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,65536,51200,3.7226647271050344
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,65536,7168,0.4328044520484076
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,65536,6144,0.3341760105556912
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,65536,6144,0.39520978927612305
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,65536,5120,0.32647376590304905
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,65536,5120,0.32958756552802193
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,65536,7168,0.42537156740824383
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,65536,8192,0.48263735241360134
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,65536,4096,0.22198843955993652
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,65536,6144,0.3670035468207465
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,65536,4096,0.274820433722602
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,65536,3584,0.19481778144836426
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,65536,7168,0.4842720031738281
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,65536,3584,0.23809067408243814
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,65536,3072,0.16821066538492838
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,65536,5120,0.3139902220831977
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,65536,3072,0.20306132899390328
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,65536,4096,0.2596195538838704
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,65536,2560,0.14351644780900744
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,65536,2048,0.11660088433159722
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,65536,1536,0.09306577841440837
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,65536,2560,0.1757404406865438
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,65536,3072,0.20126844777001274
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,65536,3584,0.22869600190056694
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,65536,2048,0.14665067195892334
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,65536,1024,0.07522933350669013
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,65536,2560,0.17440622382693818
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,65536,768,0.053386665052837796
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,65536,2048,0.1467368867662218
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,65536,1536,0.11520000298817952
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,65536,1024,0.08973689211739434
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,65536,512,0.03966755668322245
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,65536,1536,0.12056888474358453
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,65536,256,0.028672890530692205
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,65536,768,0.07344622082180448
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,65536,768,0.08320889208051893
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,65536,512,0.07032710976070829
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,65536,256,0.0587715572781033
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,65536,128,0.024714666936132643
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,65536,64,0.02113688819938236
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,65536,32,0.02148177723089854
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,65536,64,0.05487999982304043
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,65536,256,0.059143112765418164
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,65536,32,0.054449776808420815
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,65536,128,0.049689776367611356
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,65536,1024,0.09661955303615993
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,65536,512,0.06456177764468722
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,65536,128,0.05566133393181694
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,51200,16384,0.6998977661132812
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,65536,51200,3.2493805355495877
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,51200,51200,2.5048063066270614
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,51200,16384,0.8747182422214084
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,51200,65536,3.161283493041992
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,51200,12288,0.6093804571363661
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,51200,12288,0.6242248747083876
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,51200,51200,2.8617163764105906
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,51200,65536,3.6099866231282554
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,51200,10240,0.4480089081658258
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,51200,8192,0.3508728875054254
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,51200,16384,0.7917004691229926
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,51200,10240,0.5173698001437718
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,51200,7168,0.33620089954800075
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,51200,8192,0.4270666705237494
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,51200,7168,0.3648666540781657
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,51200,10240,0.4931013319227431
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,51200,6144,0.2729946772257487
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,51200,12288,0.5866773393419054
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,51200,6144,0.315466668870714
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,51200,8192,0.39980265829298234
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,51200,5120,0.21872799926333955
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,51200,4096,0.17837066120571562
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,51200,5120,0.2877359920077854
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,51200,4096,0.2374782297346327
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,51200,3584,0.16343643930223253
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,51200,7168,0.35508177015516496
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,51200,6144,0.30660443835788304
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,51200,5120,0.25851644410027397
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,51200,3072,0.16245155864291722
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,51200,3584,0.19272622797224256
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,51200,3072,0.1646675533718533
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,51200,4096,0.2193759944703844
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,51200,3584,0.19305245081583658
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,51200,2560,0.14401866330040827
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,51200,2048,0.11025777790281509
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,51200,3072,0.16904000441233316
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,51200,2048,0.119558228386773
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,51200,1536,0.0942995548248291
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,51200,2048,0.12701155079735651
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,51200,1024,0.05464622378349304
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,51200,1536,0.10335999727249146
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,51200,768,0.04313066601753235
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,51200,1024,0.07395022445254855
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,51200,1024,0.08280711041556464
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,51200,768,0.06088888645172119
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,51200,768,0.07214755482143827
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,51200,512,0.030826667944590252
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,51200,2560,0.13844177458021376
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,51200,512,0.05358577768007914
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,51200,256,0.02346399923165639
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,51200,512,0.06252266963322957
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,51200,128,0.01997955474588606
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,51200,256,0.051466666989856295
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,51200,256,0.04914311236805386
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,51200,1536,0.07082933187484741
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,51200,51200,2.6694702572292752
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,51200,64,0.01812355551454756
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,51200,32,0.023100444012218054
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,51200,2560,0.14648444122738308
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,51200,128,0.044249776336881846
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,51200,64,0.04494755466779073
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,51200,32,0.044963555203543774
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,16384,51200,0.6855502128601074
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,16384,65536,1.0076826943291557
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,51200,65536,3.3785012563069663
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,51200,128,0.046216888560189136
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,16384,51200,1.0647155973646376
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,16384,16384,0.24743199348449707
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,16384,12288,0.17438133557637533
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,16384,65536,1.347486178080241
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,16384,16384,0.35161778661939835
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,16384,10240,0.17909510930379233
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,16384,12288,0.24551023377312553
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,16384,10240,0.20865866872999403
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,16384,16384,0.3550906711154514
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,16384,8192,0.13434933291541204
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,16384,12288,0.2718577649858263
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,16384,8192,0.1655422184202406
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,16384,7168,0.11134400632646348
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,16384,10240,0.2321235603756375
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,16384,6144,0.10006578101052178
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,16384,7168,0.1464115513695611
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,16384,8192,0.1885359949535794
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,16384,6144,0.12860800160302058
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,16384,7168,0.1680391099717882
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,16384,5120,0.10913333627912734
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,16384,6144,0.15342133575015598
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,16384,4096,0.06389955679575603
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,16384,5120,0.1277208858066135
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,16384,3584,0.05661155780156454
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,16384,4096,0.09029244714313084
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,16384,3072,0.05655466847949558
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,16384,4096,0.10929244756698608
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,16384,3584,0.08120622237523396
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,16384,65536,1.4393795861138239
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,16384,3584,0.09852888849046494
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,16384,2560,0.04730755421850416
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,16384,3072,0.07054577933417426
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,16384,2048,0.03899200095070733
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,16384,3072,0.08844000101089478
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,16384,1536,0.02971733278698391
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,16384,2560,0.06397510899437799
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,16384,2048,0.06879022386338976
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,16384,1024,0.021595555875036452
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,16384,2560,0.07808178000979953
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,16384,1536,0.041783110962973706
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,16384,1536,0.05931555562549167
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,16384,768,0.017140444782045152
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,16384,1024,0.033145778708987765
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,16384,1024,0.04781244529618157
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,16384,5120,0.08157155248853895
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,16384,512,0.013458666702111563
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,16384,768,0.043079998758104115
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,16384,256,0.012069332930776807
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,16384,512,0.038455112112893
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,16384,256,0.03334310981962416
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,16384,768,0.028451555305057104
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,16384,256,0.022621333599090576
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,16384,64,0.009763555394278632
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,16384,128,0.029301332102881536
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,16384,128,0.02169688873820835
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,16384,32,0.01034222212102678
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,16384,64,0.02149066660139296
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,16384,32,0.02126311096880171
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,16384,51200,1.1169226964314778
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,16384,2048,0.05218311150868734
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,12288,51200,0.5404417779710557
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,12288,65536,0.6882159974839953
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,16384,512,0.024271999796231587
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,12288,16384,0.18279466364118788
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,12288,65536,1.1116924285888672
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,12288,16384,0.3044488959842258
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,12288,12288,0.19919555717044404
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,12288,51200,0.8669546445210775
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,12288,16384,0.28483377562628853
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,12288,10240,0.10416799783706665
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,12288,12288,0.22418488396538627
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,12288,8192,0.0862577756245931
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,12288,10240,0.16609066062503391
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,12288,7168,0.08899377452002631
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,12288,8192,0.13711467054155138
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,12288,10240,0.18536089526282418
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,12288,6144,0.0762959983613756
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,12288,8192,0.15379822254180908
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,16384,128,0.010519111322032081
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,12288,7168,0.1394533316294352
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,12288,51200,0.8907146453857422
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,12288,12288,0.14251821570926243
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,12288,5120,0.06271466943952772
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,12288,4096,0.051763554414113365
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,12288,6144,0.12212355931599934
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,12288,65536,1.1411973105536568
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,12288,3584,0.04633333285649618
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,12288,5120,0.10653333531485663
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,12288,4096,0.07612622446484037
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,12288,4096,0.09108089076148139
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,12288,3072,0.0396053327454461
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,12288,3584,0.07221421930525038
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,12288,3584,0.08350933260387844
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,12288,2560,0.032257778777016535
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,12288,3072,0.057447108957502574
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,12288,3072,0.074017776383294
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,12288,2048,0.025860443711280823
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,12288,2560,0.0518124434683058
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,12288,2560,0.06689866383870442
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,12288,1536,0.021420444051424663
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,12288,2048,0.04431644413206312
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,12288,2048,0.0586106644736396
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,12288,1024,0.01534844438234965
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,12288,1536,0.04964444372389051
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,12288,1536,0.03616088959905837
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,12288,768,0.01276533305644989
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,12288,7168,0.12009510729047988
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,12288,1024,0.04203822215398153
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,12288,1024,0.028480887413024902
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,12288,512,0.010013333625263637
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,12288,768,0.025172443853484258
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,12288,768,0.03821333249409994
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,12288,6144,0.10545955763922797
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,12288,512,0.03423733181423611
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,12288,512,0.021294222937689886
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,12288,256,0.030878222650951807
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,12288,256,0.01991911066903008
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,12288,64,0.006278222219811545
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,12288,128,0.027775999572541978
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,12288,32,0.006280000011126201
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,12288,128,0.01921688848071628
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,12288,5120,0.09186844693289863
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,12288,64,0.019151111443837483
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,12288,32,0.018917333748605516
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,10240,51200,0.42667555809020996
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,10240,65536,0.6109075546264648
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,10240,16384,0.16562488343980578
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,12288,256,0.007607111500369177
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,10240,51200,0.7703973452250162
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,10240,65536,0.9802595774332682
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,12288,128,0.006911110960774952
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,10240,12288,0.12362844414181179
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,10240,16384,0.24761422475179037
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,10240,10240,0.10489955875608657
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,10240,12288,0.1755688852734036
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,10240,8192,0.07398044400744967
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,10240,10240,0.1518239974975586
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,10240,12288,0.21646489037407768
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,10240,16384,0.28243199984232586
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,10240,7168,0.07526666588253446
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,10240,10240,0.18733867009480795
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,10240,8192,0.12105333805084229
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,10240,6144,0.06494844622082181
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,10240,8192,0.15339822239345974
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,10240,7168,0.10719911257425944
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,10240,5120,0.05542133251825968
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,10240,7168,0.1365848912133111
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,10240,4096,0.04420977830886841
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,10240,6144,0.09469422366884019
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,10240,6144,0.12306666374206543
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,10240,5120,0.10452266534169515
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,10240,3584,0.0422017772992452
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,10240,65536,1.1132533815171983
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,10240,4096,0.06742578082614474
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,10240,4096,0.08995378017425537
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,10240,3072,0.03664088911480374
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,10240,3584,0.06124533547295464
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,10240,51200,0.8774782286749946
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,10240,2560,0.03092977735731337
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,10240,3072,0.05316177672810025
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,10240,3072,0.07355644305547078
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,10240,2048,0.025568000144428674
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,10240,1536,0.02033333314789666
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,10240,2560,0.06480089161131117
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,10240,2560,0.04571911030345493
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,10240,2048,0.057927111784617104
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,10240,2048,0.03976000017589993
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,10240,1024,0.015867556134859722
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,10240,768,0.012989333106411828
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,10240,1536,0.048898667097091675
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,10240,1024,0.041167110204696655
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,10240,1024,0.026311111119058397
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,10240,512,0.010130667024188572
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,10240,768,0.022867555419603985
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,10240,256,0.007740444607204861
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,10240,768,0.03734044565094842
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,10240,128,0.006697777658700943
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,10240,512,0.019768888751665752
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,10240,512,0.03308622373474969
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,10240,256,0.030140442980660334
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,10240,256,0.01841600073708428
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,10240,64,0.006623999940024481
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,10240,128,0.018031999468803406
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,10240,128,0.026434666580624048
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,10240,64,0.017851556340853374
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,10240,5120,0.08058844672309028
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,10240,32,0.01755555636352963
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,10240,3584,0.08243466748131646
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,8192,65536,0.5221644507514106
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,8192,51200,0.3457537757025824
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,8192,16384,0.1257057719760471
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,10240,1536,0.03193511234389411
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,8192,65536,0.8577546543545194
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,8192,12288,0.0959706637594435
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,8192,16384,0.20522044764624703
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,8192,51200,0.6679457558525933
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,10240,32,0.006575999988449945
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,8192,16384,0.24768267737494576
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,8192,10240,0.08859288692474365
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,8192,8192,0.07188444667392306
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,8192,12288,0.1641306612226698
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,8192,10240,0.1296844482421875
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,8192,12288,0.1915146642261081
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,8192,7168,0.062181333700815834
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,8192,10240,0.16198489401075575
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,8192,6144,0.053864889674716525
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,8192,8192,0.1393102275000678
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,8192,7168,0.09673244423336452
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,8192,7168,0.12140711148579915
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,8192,5120,0.04579200016127693
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,8192,6144,0.0851093331972758
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,8192,65536,0.9749084048800998
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,8192,4096,0.0370488895310296
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,8192,5120,0.07233333587646484
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,8192,51200,0.7729013231065539
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,8192,3584,0.031839112440745033
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,8192,4096,0.0803768899705675
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,8192,3072,0.028129776318868
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,8192,3584,0.07362044519848294
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,8192,3584,0.05306844578848945
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,8192,2560,0.024650666448805068
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,8192,3072,0.04692622356944614
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,8192,3072,0.0657164454460144
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,8192,2048,0.020050666398472257
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,8192,2560,0.05877066983116997
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,8192,2560,0.04108177622159322
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,8192,1536,0.015784000356992085
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,8192,2048,0.03570844398604499
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,8192,8192,0.10812622308731079
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,8192,1024,0.013027555412716336
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,8192,1536,0.029153777493370905
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,8192,1536,0.045082665152019925
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,8192,768,0.011001778145631155
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,8192,1024,0.02366488840844896
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,8192,1024,0.03668355610635545
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,8192,512,0.008963555925422246
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,8192,6144,0.10863910781012641
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,8192,768,0.034076445632510714
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,8192,256,0.007173333730962541
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,8192,5120,0.09331644243664211
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,8192,512,0.01826844447188907
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,8192,512,0.031748443841934204
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,8192,128,0.006625777731339137
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,8192,4096,0.0591742197672526
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,8192,256,0.029490666257010564
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,8192,256,0.01717511150572035
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,8192,64,0.006305777778228124
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,8192,32,0.006251555350091722
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,8192,128,0.01683466633160909
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,8192,64,0.016545777519543965
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,8192,32,0.016538666354285348
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,7168,65536,0.4628888765970866
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,7168,51200,0.3509982162051731
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,8192,2048,0.05282844437493218
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,7168,16384,0.12258844905429417
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,7168,65536,0.8044311205546061
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,8192,768,0.0210479994614919
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,7168,16384,0.19002932972378203
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,7168,51200,0.6348240110609267
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,7168,12288,0.14607911639743382
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,7168,16384,0.24637511041429308
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,8192,128,0.02535466684235467
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,7168,10240,0.09513777494430542
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,7168,12288,0.18931821982065836
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,7168,10240,0.1244151062435574
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,7168,10240,0.16167822149064806
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,7168,8192,0.10229155752393936
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,7168,8192,0.13361777199639216
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,7168,6144,0.059282667107052274
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,7168,7168,0.12087021933661567
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,7168,65536,0.9664808909098307
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,7168,51200,0.7630142105950249
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,7168,5120,0.04874577787187365
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,7168,6144,0.08010311259163751
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,7168,6144,0.10713155402077569
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,7168,5120,0.0684079991446601
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,7168,5120,0.09279200103547837
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,7168,12288,0.09278933207194011
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,7168,3584,0.03455466694302029
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,7168,4096,0.055918223328060575
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,7168,4096,0.08000000317891438
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,7168,3072,0.029041777054468792
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,7168,3584,0.07327289051479764
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,7168,3584,0.05009777678383721
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,7168,2560,0.02457155618402693
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,7168,8192,0.07942844761742486
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,7168,3072,0.044686221414142184
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,7168,2048,0.020755555894639757
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,7168,2560,0.039284444517559476
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,7168,2560,0.05879200167126126
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,7168,7168,0.06793066528108385
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,7168,1536,0.017338666650984023
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,7168,2048,0.05246577660242716
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,7168,2048,0.03411644366052415
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,7168,1024,0.011395555403497485
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,7168,1536,0.02791022260983785
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,7168,7168,0.09178755680720012
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,7168,1536,0.044477333625157676
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,7168,768,0.009359999663299983
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,7168,512,0.007295110987292395
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,7168,1024,0.038146668010287814
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,7168,768,0.03325600094265408
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,7168,768,0.019887111253208585
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,7168,256,0.005888000130653381
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,7168,512,0.01752711170249515
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,7168,512,0.030863109562132094
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,7168,128,0.005576000031497743
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,7168,256,0.028099556763966877
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,7168,256,0.016490666402710807
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,7168,64,0.005214222189452913
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,7168,128,0.025031111306614343
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,7168,32,0.005229333208666907
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,7168,128,0.016209777858522203
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,7168,64,0.015847111741701763
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,7168,32,0.01548266741964552
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,7168,3072,0.0655884411599901
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,6144,65536,0.40748710102505153
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,6144,51200,0.2700977855258518
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,6144,16384,0.09655911392635769
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,6144,65536,0.7313146591186523
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,7168,1024,0.02264533274703556
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,6144,16384,0.17516177230411104
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,6144,12288,0.07903999752468534
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,7168,4096,0.03908266623814901
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,6144,10240,0.06285155481762357
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,6144,12288,0.13407022423214382
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,6144,12288,0.16430221663581
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,6144,10240,0.11293155617184109
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,6144,8192,0.05077244506941902
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,6144,10240,0.140794661309984
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,6144,65536,0.8335750897725424
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,6144,7168,0.045062220758861966
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,6144,8192,0.09332178036371867
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,6144,51200,0.6615697542826334
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,6144,8192,0.11664799849192302
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,6144,6144,0.03854666815863715
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,6144,5120,0.03226666649182638
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,6144,7168,0.10589510864681667
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,6144,6144,0.07360888852013482
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,6144,6144,0.09447999795277913
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,6144,4096,0.027464000715149775
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,6144,5120,0.061326218975914844
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,6144,5120,0.08165778054131402
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,6144,4096,0.050395554966396756
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,6144,4096,0.07091110944747925
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,6144,3072,0.02091644373204973
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,6144,51200,0.5703333218892416
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,6144,3584,0.06556355290942721
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,6144,2560,0.01789955629242791
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,6144,3072,0.04043289025624593
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,6144,16384,0.2116426626841227
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,6144,3072,0.058493336041768394
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,6144,2048,0.015473778049151102
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,6144,2560,0.03616088959905837
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,6144,2560,0.05306844578848945
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,6144,1536,0.012667555775907306
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,6144,2048,0.031629333893458046
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,6144,2048,0.04798310995101929
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,6144,1024,0.010115555591053432
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,6144,1536,0.025399110383457605
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,6144,1536,0.04101244608561198
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,6144,768,0.00831733312871721
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,6144,1024,0.033760888708962336
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,6144,1024,0.020727111233605277
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,6144,512,0.006610666712125142
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,6144,768,0.018858666221300762
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,6144,768,0.030885332160525854
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,6144,256,0.005780444376998478
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,6144,512,0.029491557015313044
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,6144,7168,0.08342488606770833
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,6144,512,0.016864889197879367
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,6144,128,0.004915555732117759
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,6144,64,0.004222222086456087
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,6144,256,0.027079110344250996
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,6144,32,0.004536889079544279
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,6144,3584,0.023618666662110224
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,6144,128,0.024713777833514746
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,6144,128,0.015493333339691162
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,6144,64,0.015244444211324057
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,6144,32,0.015174221661355762
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,6144,3584,0.04533511069085863
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,5120,65536,0.3180470996432834
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,5120,51200,0.2725626627604167
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,5120,16384,0.08504888746473525
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,5120,16384,0.1617466608683268
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,5120,51200,0.5257813135782877
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,5120,12288,0.06655644708209567
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,5120,16384,0.21705778439839682
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,5120,10240,0.056984000735812716
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,5120,12288,0.123233781920539
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,5120,12288,0.16826132933298746
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,5120,10240,0.10662400060229832
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,5120,8192,0.045647111203935414
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,5120,10240,0.139646225505405
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,5120,51200,0.6506542099846734
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,5120,7168,0.04065510961744521
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,5120,65536,0.8271635373433431
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,5120,8192,0.08766133255428737
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,5120,8192,0.11991466416252984
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,5120,6144,0.036087112294303045
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,5120,5120,0.030282666285832722
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,5120,7168,0.07820088995827569
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,5120,7168,0.1054133309258355
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,5120,6144,0.09447022279103597
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,5120,6144,0.06797422303093804
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,5120,4096,0.024248000648286607
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,5120,3584,0.021588444709777832
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,5120,5120,0.05673866801791721
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,5120,5120,0.08087911208470662
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,5120,3072,0.01956266661485036
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,5120,4096,0.07052177853054471
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,5120,4096,0.04697688751750522
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,5120,3584,0.06490933232837252
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,5120,3584,0.04302311274740431
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,5120,65536,0.6713582144843208
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,5120,2048,0.015003555350833468
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,5120,3072,0.03809422254562378
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,5120,2560,0.052383999029795326
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,5120,2560,0.033929778469933405
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,5120,1536,0.012702222499582501
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,5120,2048,0.04737155636151632
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,5120,2048,0.029494222667482164
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,5120,1024,0.009789333575301701
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,5120,1536,0.023787554767396715
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,5120,1536,0.03901688920127021
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,5120,768,0.00794311116139094
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,6144,256,0.015862221519152325
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,5120,1024,0.03334044416745504
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,5120,512,0.00658044425977601
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,5120,768,0.017889777819315594
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,5120,768,0.030862222115198772
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,5120,256,0.005609777652555042
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,5120,512,0.028785778416527644
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,5120,128,0.0052044445441828836
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,5120,256,0.015236443943447538
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,5120,128,0.01480888823668162
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,5120,128,0.02472177810139126
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,5120,64,0.004888888862397936
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,5120,32,0.00554666668176651
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,5120,64,0.014547554983033074
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,5120,32,0.014442667365074158
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,5120,3072,0.05827022261089749
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,4096,65536,0.2553937700059679
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,4096,51200,0.22722665468851724
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,5120,1024,0.019899555378490023
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,4096,16384,0.07263555791642931
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,4096,65536,0.619583977593316
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,5120,512,0.016136000553766888
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,4096,12288,0.05252888798713684
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,4096,51200,0.48339467578464085
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,4096,16384,0.15005155404408774
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,4096,10240,0.04626577761438158
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,4096,16384,0.21001066101921928
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,4096,12288,0.11220355828603108
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,4096,12288,0.16192532910241023
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,4096,8192,0.03557777735922072
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,4096,10240,0.09785599841011895
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,5120,2560,0.01750666730933719
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,4096,65536,0.8195368978712293
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,4096,7168,0.03264710969395108
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,4096,10240,0.1382933325237698
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,4096,6144,0.03141866789923774
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,4096,8192,0.08114755815929837
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,4096,51200,0.6431422233581543
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,4096,5120,0.024883555041419134
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,4096,7168,0.07176622417238024
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,4096,7168,0.10452089044782852
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,4096,6144,0.0632879998948839
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,4096,6144,0.11019111341900295
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,4096,5120,0.0528675549560123
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,4096,5120,0.08043111032909818
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,4096,3584,0.02261688808600108
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,4096,3072,0.020394666327370536
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,4096,4096,0.044284443060557045
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,4096,4096,0.06952444712320964
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,4096,2560,0.015108444624476962
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,4096,3584,0.06458489100138347
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,4096,3584,0.040694223509894475
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,4096,3072,0.057605332798428006
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,4096,3072,0.037752889924579196
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,4096,2048,0.01309333327743742
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,4096,2560,0.03195377853181627
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,4096,1536,0.01033333357837465
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,5120,256,0.026828444666332666
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,4096,2048,0.028563555743959215
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,4096,2048,0.04662222332424588
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,4096,1024,0.008295111358165741
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,4096,1536,0.038378665844599404
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,4096,1536,0.022657778528001573
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,4096,768,0.0069226668112807805
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,4096,1024,0.03388444582621256
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,4096,512,0.005899555567238066
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,4096,768,0.01716800034046173
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,4096,768,0.031086222993002996
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,4096,256,0.004906666775544484
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,4096,512,0.015524443652894763
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,4096,512,0.02828622195455763
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,4096,8192,0.11532710658179389
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,4096,128,0.004543111142185
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,4096,256,0.014793778459231058
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,4096,256,0.02605244517326355
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,4096,64,0.0041831110914548235
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,4096,4096,0.02089866664674547
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,4096,128,0.02365600069363912
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,4096,128,0.014096889230940076
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,4096,64,0.0141004439857271
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,4096,32,0.013814222481515674
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,3584,65536,0.2256960074106852
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,3584,51200,0.2017493380440606
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,4096,2560,0.05190222130881416
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,3584,16384,0.058584888776143394
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,3584,65536,0.5828471183776855
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,4096,1024,0.01885955532391866
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,3584,51200,0.45348358154296875
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,3584,12288,0.04922044608328077
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,3584,16384,0.20784800582461885
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,3584,12288,0.10760444402694702
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,3584,10240,0.04014755619896783
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,3584,12288,0.1611457798216078
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,3584,8192,0.03374400072627597
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,4096,32,0.0041857775714662345
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,3584,65536,0.8155786726209852
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,3584,10240,0.09202400181028579
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,3584,10240,0.13757777214050293
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,3584,51200,0.6409217516581217
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,3584,7168,0.03056266572740343
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,3584,8192,0.07598755757013957
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,3584,6144,0.026650667190551758
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,3584,8192,0.11487910482618545
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,3584,5120,0.02239911092652215
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,3584,7168,0.0677715539932251
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,3584,7168,0.10393510924445258
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,3584,6144,0.05875911315282186
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,3584,6144,0.09238577551311916
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,3584,4096,0.02033866610791948
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,3584,5120,0.04900799857245552
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,3584,5120,0.07970755630069308
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,3584,3072,0.014654222461912366
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,3584,4096,0.04139288928773668
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,3584,4096,0.06898488601048787
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,3584,3584,0.0381004446082645
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,3584,3584,0.06449155675040351
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,3584,3072,0.033913777934180364
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,3584,3072,0.05727466609742907
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,3584,2048,0.011567110816637674
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,3584,16384,0.14031999640994602
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,3584,2560,0.02994399931695726
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,3584,1536,0.009276444713274637
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,3584,2048,0.046224001381132335
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,3584,1024,0.007262222468852997
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,3584,1536,0.021328889661365088
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,3584,1536,0.038098666403028704
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,3584,768,0.006337777607970768
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,3584,1024,0.033137778441111244
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,3584,1024,0.01791555517249637
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,3584,512,0.005214222189452913
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,3584,768,0.016508445143699646
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,3584,768,0.03048355711830987
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,3584,256,0.004528000122971005
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,3584,512,0.014848889576064216
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,3584,512,0.02914311157332526
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,3584,128,0.0041831110914548235
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,3584,256,0.025642666551801894
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,3584,256,0.014256000518798828
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,3584,64,0.0038373333712418876
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,3584,3584,0.016474665866957772
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,3584,32,0.0038311113086011675
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,3584,128,0.02381155557102627
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,3584,64,0.013813333378897773
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,3584,2560,0.01309333327743742
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,3584,32,0.013724444641007317
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,3072,65536,0.22135378254784477
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,3584,2560,0.051757332351472646
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,3072,51200,0.16073155403137207
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,3584,2048,0.02640977833006117
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,3072,16384,0.05593066745334201
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,3072,65536,0.544281800587972
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,3072,16384,0.13080622090233698
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,3072,12288,0.04169333312246534
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,3072,16384,0.17494932810465494
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,3072,51200,0.4441208839416504
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,3072,10240,0.03557866811752319
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,3072,12288,0.09994844595591228
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,3072,12288,0.13636710908677843
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,3072,10240,0.08678222364849514
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,3072,8192,0.026891556051042344
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,3072,10240,0.11645510461595322
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,3072,7168,0.024031110935741003
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,3072,51200,0.5358533329433864
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,3072,65536,0.6815564367506238
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,3584,128,0.013952889376216464
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,3072,8192,0.07094666692945692
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,3072,6144,0.022652443912294176
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,3072,8192,0.09877333376142715
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,3072,5120,0.018964444597562153
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,3072,7168,0.08871110942628647
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,3072,4096,0.01629244453377194
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,3072,6144,0.07918666468726264
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,3072,6144,0.05471377902560764
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,3072,5120,0.045780443482928805
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,3072,3584,0.01458044515715705
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,3072,3072,0.013450666434235044
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,3072,4096,0.060276442103915744
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,3072,3584,0.05626489056481255
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,3072,2560,0.012085333466529846
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,3072,3072,0.05106666684150696
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,3072,2560,0.046012444628609546
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,3072,2048,0.01038933296998342
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,3072,2048,0.025399110383457605
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,3072,2048,0.041054222318861223
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,3072,1536,0.008046222229798635
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,3072,7168,0.06270044379764132
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,3072,1536,0.020474667350451153
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,3072,1024,0.006271111054552927
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,3072,5120,0.06944711340798272
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,3072,1536,0.03397422366672092
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,3072,768,0.0058559998869895935
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,3072,4096,0.039232889811197914
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,3072,1024,0.017455110947291057
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,3072,512,0.00488800017370118
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,3072,1024,0.029937777254316542
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,3072,3584,0.03594755464129978
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,3072,256,0.0041955556306574075
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,3072,768,0.02843822373284234
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,3072,3072,0.032462222708596125
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,3072,128,0.0039048890272776284
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,3072,512,0.02678577767478095
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,3072,256,0.02502311103873783
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,3072,256,0.013864888913101621
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,3072,2560,0.028512001037597656
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,3072,64,0.003528000166018804
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,3072,32,0.003847111016511917
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,3072,128,0.013799111048380533
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,3072,64,0.013423999978436364
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,3072,32,0.013419555293189155
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,2560,65536,0.17968089050716826
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,2560,51200,0.14054132832421198
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,2560,65536,0.5292826758490669
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,2560,51200,0.4156168831719293
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,2560,16384,0.048601776361465454
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,2560,16384,0.12929688559638128
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,3072,768,0.015784889459609985
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,2560,16384,0.1738826698727078
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,2560,12288,0.03562577896647983
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,3072,512,0.014785778191354541
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,2560,65536,0.677478207482232
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,2560,51200,0.5342586835225424
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,2560,10240,0.03130844566557143
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,2560,8192,0.02512977851761712
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,2560,12288,0.09493777487013076
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,2560,12288,0.13611111376020643
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,2560,7168,0.022099556194411382
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,2560,10240,0.08509777651892768
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,2560,10240,0.11591022544436985
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,2560,8192,0.06970400280422635
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,2560,8192,0.09735733270645142
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,2560,6144,0.019440889358520508
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,2560,5120,0.017145777742067974
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,2560,7168,0.08811466561423408
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,2560,7168,0.06123110983106825
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,2560,6144,0.07851111226611666
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,2560,4096,0.014803555276658801
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,2560,6144,0.053322666221194796
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,2560,5120,0.04523288872506884
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,2560,5120,0.06885688834720187
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,2560,3072,0.01235466698805491
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,2560,4096,0.060099555386437305
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,2560,4096,0.03863199883037143
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,2560,3584,0.035306665632459856
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,2560,3584,0.055919110774993896
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,2560,2560,0.010727110836240979
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,2560,2048,0.009347555538018545
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,2560,3072,0.03137600090768602
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,2560,2560,0.04379822148217095
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,2560,2560,0.027122666438420612
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,2560,1536,0.006986666884687211
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,2560,2048,0.02404622236887614
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,2560,1024,0.005943999936183293
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,2560,1536,0.020080000162124634
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,2560,1536,0.03427377674314711
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,2560,768,0.005290666802061929
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,2560,1024,0.029855999681684706
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,2560,1024,0.017217778497272067
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,2560,512,0.004880889008442561
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,3072,128,0.022623111804326374
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,2560,512,0.014501333236694336
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,2560,256,0.004181333300140169
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,2560,512,0.02641777859793769
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,2560,256,0.02402577797571818
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,2560,256,0.013779555757840475
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,2560,3584,0.013376889129479727
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,2560,128,0.0038293335172865125
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,2560,64,0.003552888830502828
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,2560,128,0.013403555585278405
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,2560,32,0.003858666867017746
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,2560,64,0.013078221844302284
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,2560,3072,0.05016888843642341
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,2560,32,0.013305777476893531
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,2048,65536,0.14958755175272623
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,2560,2048,0.03951822386847602
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,2048,51200,0.11353866259256999
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,2048,65536,0.491962644788954
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,2560,768,0.027781334188249376
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,2048,51200,0.38554933336046004
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,2048,16384,0.03997066617012024
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,2048,12288,0.03028622269630432
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,2048,16384,0.11855110857221816
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,2048,16384,0.17322933673858643
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,2048,12288,0.09109155337015788
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,2048,10240,0.025768889321221247
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,2048,51200,0.5304373105367025
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,2048,65536,0.672327995300293
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,2048,8192,0.020907556017239887
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,2048,12288,0.1352062225341797
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,2560,128,0.022327999273935955
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,2048,7168,0.018545778261290658
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,2048,10240,0.07784089114930895
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,2048,10240,0.11526578002505833
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,2048,6144,0.01661422186427646
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,2048,8192,0.06377955277760823
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,2048,5120,0.014143110977278816
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,2048,7168,0.08778844277064006
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,2048,6144,0.04920266734229194
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,2048,6144,0.07764710982640584
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,2048,4096,0.012387555506494312
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,2048,5120,0.0687075588438246
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,2048,3584,0.011385777758227454
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,2048,4096,0.035828444692823626
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,2048,4096,0.05951466825273302
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,2048,3072,0.010668444136778513
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,2048,3584,0.03277511066860623
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,2048,3584,0.05471733212471008
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,2048,2560,0.009298666483826106
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,2048,3072,0.029330667522218492
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,2048,3072,0.048082666264639966
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,2048,2048,0.008087111016114553
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,2048,2560,0.02637333340115017
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,2048,2048,0.022666666242811415
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,2048,2048,0.03906755646069845
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,2048,1536,0.00702400008837382
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,2048,1536,0.03396888905101352
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,2048,1024,0.005919999960396025
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,2048,8192,0.09652977519565159
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,2048,7168,0.05533511108822293
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,2048,768,0.0052888890107472735
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,2048,1024,0.01650399963061015
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,2048,1024,0.02979644470744663
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,2048,512,0.004555555681387584
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,2048,5120,0.04185600082079569
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,2048,768,0.014832889040311178
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,2048,768,0.027802666028340656
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,2048,256,0.0042275554604000514
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,2048,512,0.014111111561457316
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,2048,512,0.026782222919993933
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,2048,256,0.013456000222100152
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,2048,256,0.02472711106141408
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,2560,768,0.015460444821251763
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,2048,64,0.003559999995761447
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,2048,32,0.004032000071472592
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,2048,128,0.01309333327743742
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,2048,128,0.023054222265879314
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,2048,64,0.01275022245115704
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,1536,65536,0.1259875562455919
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,2048,32,0.012724444270133972
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,1536,51200,0.09682933489481609
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,2048,1536,0.018868444694413077
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,1536,65536,0.449635558658176
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,1536,16384,0.031097776359981958
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,1536,51200,0.35357067320081925
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,1536,12288,0.024246222443050806
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,1536,16384,0.11006400320265029
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,1536,16384,0.17040356000264487
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,1536,10240,0.020785777105225455
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,1536,12288,0.08384266826841567
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,1536,8192,0.017321777012613084
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,1536,65536,0.6593679851955837
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,1536,51200,0.519604418012831
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,1536,10240,0.11350844966040717
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,2048,128,0.0038702223036024305
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,1536,10240,0.0713813304901123
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,1536,8192,0.05784089035458035
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,1536,6144,0.013682666752073499
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,1536,8192,0.09480622079637314
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,1536,7168,0.08580444256464641
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,1536,7168,0.051727109485202365
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,1536,5120,0.01292711082432005
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,1536,6144,0.04423022270202637
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,1536,6144,0.07664089070426093
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,1536,4096,0.010840888652536603
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,1536,5120,0.03920800156063504
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,1536,5120,0.06714400317933825
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,1536,3584,0.009374221993817223
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,1536,4096,0.032567110326555036
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,1536,4096,0.05849066707823011
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,1536,3072,0.008637333081828224
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,1536,3584,0.029542220963372126
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,1536,3584,0.0528035561243693
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,1536,2560,0.007930667036109501
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,1536,3072,0.026556443836953905
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,1536,3072,0.047725333107842334
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,1536,2048,0.006681777950790193
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,1536,2560,0.0236817780468199
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,1536,2560,0.04294133186340332
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,1536,1536,0.005589333259397083
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,1536,2048,0.03923644291030036
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,1536,2048,0.021560000048743352
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,1536,1024,0.004872888740566042
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,1536,12288,0.13242133458455405
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,1536,1536,0.017823111679818895
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,1536,1536,0.03382133444150289
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,1536,768,0.0042275554604000514
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,1536,512,0.0041777777175108595
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,1536,1024,0.02950577934583028
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,1536,7168,0.015481778317027621
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,1536,768,0.02777066661251916
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,1536,768,0.014168888330459595
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,1536,256,0.00350222239891688
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,1536,512,0.013732444081041547
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,1536,128,0.0034871109657817413
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,1536,512,0.02642400066057841
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,1536,64,0.0032133333798911837
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,1536,256,0.024340444140964087
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,1536,256,0.013103110922707452
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,1536,32,0.0032266666077905228
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,1536,128,0.022350221872329712
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,1536,128,0.01273155543539259
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,1536,64,0.01240711079703437
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,2048,2560,0.04334133201175266
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,1024,65536,0.09050133493211533
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,1536,32,0.012418666647540199
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,1024,16384,0.025603555970721777
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,1024,51200,0.06794933478037517
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,1024,16384,0.10797066820992364
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,1024,16384,0.16940532790289986
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,1024,65536,0.44170488251580137
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,1024,12288,0.021048888564109802
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,1024,10240,0.018025777406162687
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,1024,12288,0.08203999863730536
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,1024,51200,0.5154346889919704
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,1024,10240,0.07005688879224989
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,1024,8192,0.01605244477589925
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,1536,1024,0.015484443969196744
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,1024,10240,0.11227467324998643
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,1024,7168,0.014430221584108142
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,1024,8192,0.09387999773025513
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,1024,8192,0.056891553931766085
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,1024,6144,0.01275199982855055
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,1024,7168,0.04929511083496941
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,1024,5120,0.010675555302037133
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,1024,6144,0.0437448885705736
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,1024,6144,0.07612266805436876
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,1024,4096,0.008959111240175035
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,1024,5120,0.036955555280049644
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,1024,4096,0.03154044349988302
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,1024,3584,0.008250666989220513
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,1024,4096,0.056886222627427846
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,1024,3584,0.028804444604449805
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,1024,51200,0.34789689381917316
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,1024,3584,0.054026666614744395
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,1024,12288,0.1316008832719591
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,1024,3072,0.046588444047504
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,1024,2560,0.0069057775868309875
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,1024,65536,0.6544159783257378
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,1024,2048,0.005909333212508096
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,1024,2560,0.023377777801619634
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,1024,2560,0.04249688982963562
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,1024,1536,0.005506666584147348
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,1024,2048,0.02090666691462199
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,1024,2048,0.03838933176464505
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,1024,1024,0.004877333425813251
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,1024,1536,0.017862222260899015
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,1024,1536,0.033258666594823204
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,1024,768,0.00423555572827657
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,1024,1024,0.029504888587527808
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,1024,5120,0.06673600276311238
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,1024,768,0.014191110928853353
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,1024,512,0.003914666672547658
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,1024,768,0.02786488996611701
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,1024,512,0.013455111119482251
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,1024,256,0.0032275555034478507
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,1024,3072,0.007299555672539606
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,1024,128,0.0032551110618644287
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,1024,256,0.012785777449607849
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,1024,256,0.02365511159102122
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,1024,3072,0.02593244446648492
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,1024,64,0.00349866681628757
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,1024,128,0.021935999393463135
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,1024,32,0.003170666595300039
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,1024,64,0.012100444071822695
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,768,65536,0.0666159987449646
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,1024,32,0.01205244412024816
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,768,51200,0.05518933468394809
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,1024,7168,0.08541866805818345
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,1024,1024,0.015455999308162265
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,768,65536,0.4024648931291368
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,768,16384,0.02106399999724494
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,768,51200,0.31678133540683323
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,768,12288,0.01982133256064521
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,768,16384,0.0985928906334771
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,768,16384,0.1679635577731662
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,768,65536,0.6521964603000218
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,768,10240,0.0169831116994222
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,768,51200,0.5139608912997776
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,768,8192,0.01459022197458479
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,768,12288,0.13110844294230142
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,768,10240,0.063573333952162
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,768,10240,0.1118133332994249
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,768,7168,0.012924444344308643
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,1024,128,0.012424888710180918
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,768,6144,0.011391999820868174
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,768,8192,0.09358133210076226
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,768,7168,0.04501510990990532
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,768,5120,0.0101742222905159
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,768,6144,0.03924444317817688
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,768,6144,0.07596444421344332
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,768,4096,0.00868444475862715
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,768,5120,0.03383200036154853
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,768,5120,0.06501866711510552
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,768,3584,0.007975111405054728
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,768,4096,0.029472000069088403
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,768,4096,0.056399113602108426
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,768,3072,0.007289778027269576
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,768,3584,0.026884444885783728
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,768,3584,0.05180266830656263
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,768,2560,0.006584888945023219
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,768,3072,0.024396444360415142
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,768,3072,0.046741333272722035
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,768,2048,0.005655999812814925
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,768,2560,0.021885333789719477
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,768,12288,0.0747671127319336
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,768,2560,0.042098667886522084
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,768,1536,0.0052577778697013855
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,768,2048,0.038346668084462486
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,768,1024,0.004538666870858935
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,768,1536,0.016873778568373788
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,768,1536,0.03321866525544061
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,768,768,0.0038968887594011095
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,768,8192,0.05095644460784065
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,768,1024,0.014774221513006421
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,768,512,0.0038444445365005066
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,768,1024,0.02879200047916836
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,768,7168,0.08548977639940049
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,768,256,0.003206222214632564
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,768,768,0.013796444568369122
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,768,512,0.02574488851759169
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,768,512,0.012740444805887012
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,768,128,0.003185777821474605
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,768,256,0.024682665864626568
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,768,256,0.01240355521440506
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,768,64,0.0031439999325407874
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,768,32,0.0031600000543726813
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,768,128,0.021606221795082092
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,768,128,0.01204355557759603
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,768,64,0.011766222616036734
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,512,65536,0.0466231107711792
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,768,32,0.011716444459226398
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,512,51200,0.03889244463708665
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,1024,512,0.02641777859793769
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,512,16384,0.01939733326435089
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,512,65536,0.40175822046067977
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,768,2048,0.01955911186006334
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,512,12288,0.0162426663769616
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,512,16384,0.09529155492782593
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,512,16384,0.16752178139156768
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,512,51200,0.5114835633171929
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,512,10240,0.014885332849290637
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,512,12288,0.07418400049209595
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,512,8192,0.013394667042626275
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,512,12288,0.1306826670964559
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,768,768,0.02676800058947669
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,512,7168,0.012091555529170565
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,512,10240,0.11197688844468857
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,512,8192,0.04974844389491611
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,512,8192,0.09381066428290473
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,512,6144,0.010882666541470421
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,512,7168,0.04469155602984958
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,512,7168,0.08481866783565944
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,512,5120,0.009434666898515489
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,512,6144,0.038535998927222356
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,512,6144,0.07485689057244195
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,512,4096,0.007995555798212687
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,512,5120,0.03356711069742838
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,512,3584,0.007415999968846639
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,512,5120,0.065920889377594
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,512,4096,0.0558791094356113
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,512,4096,0.028724445237053767
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,512,3072,0.0069653333889113525
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,512,3584,0.026426666312747534
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,512,3584,0.05167288912667168
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,512,2560,0.006224888894293044
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,512,51200,0.3161999914381239
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,512,3072,0.0466213325659434
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,512,2048,0.005608888963858287
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,512,2560,0.02162488963868883
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,512,2560,0.042039109600914844
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,512,1536,0.005227555417352253
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,512,2048,0.01924000018172794
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,512,2048,0.03804088963402642
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,512,1024,0.0041991112132867174
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,512,1536,0.016480889585283067
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,512,1536,0.03299377693070306
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,512,768,0.003899555653333664
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,512,1024,0.028804444604449805
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,512,10240,0.06255555815166898
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,512,512,0.0034924443397257063
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,512,768,0.027072888281610277
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,512,256,0.003212444484233856
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,512,512,0.0251866661840015
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,512,512,0.012725333372751871
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,512,128,0.0031946665710873077
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,512,256,0.012085333466529846
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,512,256,0.02329155637158288
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,512,64,0.003137777869900068
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,512,128,0.011781333221329583
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,512,32,0.0031617778456873367
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,512,64,0.011728888584507836
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,512,32,0.011401777466138205
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,256,65536,0.03141422073046366
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,512,3072,0.02399377855989668
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,256,51200,0.029135111305448744
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,512,65536,0.6501519944932725
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,256,65536,0.3999342123667399
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,256,16384,0.013472889032628802
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,512,1024,0.014779556128713818
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,256,51200,0.3153662151760525
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,512,768,0.013775111072593264
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,256,12288,0.011729777687125735
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,256,65536,0.6462666723463271
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,256,10240,0.01071999967098236
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,256,16384,0.1670453283521864
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,256,12288,0.07361066341400146
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,256,12288,0.13082044654422337
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,256,51200,0.510042667388916
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,256,8192,0.00962577760219574
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,256,10240,0.0617413322130839
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,256,7168,0.009024000002278222
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,512,128,0.021314667330847845
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,256,10240,0.11123022768232559
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,256,6144,0.008648888932334052
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,256,8192,0.04932889011171129
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,256,8192,0.09318400091595119
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,256,7168,0.04320444332228767
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,256,5120,0.007961778177155389
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,256,6144,0.07542310820685492
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,256,4096,0.007941332956155142
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,256,6144,0.037682665718926325
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,256,5120,0.06390577554702759
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,256,5120,0.03315555718210008
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,256,4096,0.055790219042036265
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,256,4096,0.02906222144762675
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,256,3072,0.006700444552633498
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,256,3584,0.051410665114720665
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,256,3584,0.026128000683254663
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,256,2560,0.005904888941182031
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,256,3072,0.023511111736297607
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,256,3072,0.04619733492533366
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,256,2048,0.005574222240183089
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,256,2560,0.02136444383197361
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,256,2560,0.041816890239715576
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,256,1536,0.004576888763242298
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,256,2048,0.03780444463094076
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,256,16384,0.09646133581797282
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,256,1024,0.003976888954639435
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,256,1536,0.03263466556866964
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,256,1536,0.01646933290693495
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,256,768,0.0039022221333450745
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,256,1024,0.028836445675955877
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,256,512,0.003499555504984326
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,256,768,0.013343999783198038
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,256,512,0.02535999980237749
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,256,512,0.01239466667175293
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,256,256,0.0031804444475306403
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,256,7168,0.08508088853624131
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,256,128,0.0028568889117903183
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,256,256,0.01204711116022534
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,256,3584,0.007258666886223688
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,256,128,0.011780444118711682
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,256,64,0.002826666666401757
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,256,128,0.021253334151373968
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,256,32,0.00282222218811512
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,256,64,0.01180355581972334
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,128,65536,0.026513778501086768
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,256,32,0.011577777564525604
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,128,51200,0.018571555614471436
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,256,2048,0.019261333677503798
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,256,1024,0.014481777946154276
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,128,65536,0.3994346724616156
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,256,768,0.026410667432679072
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,128,16384,0.01238044434123569
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,128,12288,0.010229333407349056
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,128,65536,0.6475093099806044
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,128,16384,0.16784977912902832
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,128,12288,0.07264800204171075
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,128,51200,0.5096622043185765
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,128,10240,0.009759999811649323
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,256,256,0.0229777776532703
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,128,8192,0.008791111409664154
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,128,12288,0.13049156135982937
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,128,7168,0.00830844458606508
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,128,10240,0.061439110173119434
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,128,10240,0.11141422059800889
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,128,8192,0.09256088733673096
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,128,8192,0.04807022213935852
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,128,6144,0.00795111142926746
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,128,5120,0.007592889169851939
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,128,7168,0.04345422320895725
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,128,7168,0.08369333214230007
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,128,6144,0.03767733441458808
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,128,4096,0.007648000286685095
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,128,5120,0.03297777639495002
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,128,5120,0.06332177586025663
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,128,3584,0.007606222397751278
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,128,4096,0.0280675556924608
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,128,4096,0.05528444382879469
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,128,3072,0.006275555739800136
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,128,3584,0.026221333278550044
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,128,3584,0.05118844575352139
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,128,2560,0.005937777873542573
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,128,3072,0.023581332630581323
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,128,3072,0.04604444570011563
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,128,2048,0.005218666460778978
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,128,51200,0.31457776493496364
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,128,2560,0.021543999512990315
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,128,2560,0.04168355464935303
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,128,1536,0.00452533322903845
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,128,2048,0.018944889307022095
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,128,1024,0.0038497779104444715
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,128,16384,0.09646844201617771
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,128,1536,0.032532443602879844
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,128,768,0.0038844446341196695
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,128,1536,0.016539555456903245
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,128,1024,0.02882666720284356
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,128,1024,0.014474666780895658
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,128,768,0.026776888304286536
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,128,768,0.013072888884279462
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,128,256,0.0029031110720502008
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,128,512,0.025016888976097107
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,128,512,0.01240888900227017
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,128,128,0.0028524444335036804
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,128,256,0.011743110915025076
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,128,64,0.0028080000645584534
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,128,128,0.011727111207114326
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,128,128,0.020978666014141504
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,128,32,0.002838222309947014
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,128,6144,0.07266666491826375
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,64,65536,0.02570488883389367
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,128,64,0.011707555916574268
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,64,51200,0.01923199991385142
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,128,32,0.011398221883508893
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,64,16384,0.009701333112186855
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,64,12288,0.008623110751310984
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,64,16384,0.09562222162882487
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,64,12288,0.0725511113802592
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,64,10240,0.009292444421185387
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,64,65536,0.39957332611083984
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,64,51200,0.31466934416029185
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,64,8192,0.008616888688670265
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,64,7168,0.007991111112965478
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,64,6144,0.007613333563009898
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,128,2048,0.03765599926312765
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,64,10240,0.06116888920466105
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,64,8192,0.04913599954711067
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,64,5120,0.008275555239783393
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,64,7168,0.04210933380656772
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,64,4096,0.007315555380450354
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,64,3584,0.0069448889957533936
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,128,512,0.0035093331502543557
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,64,3072,0.006903999795516332
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,64,2560,0.006573333508438534
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,64,5120,0.03258400162061056
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,64,4096,0.02808622188038296
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,64,2048,0.005225777626037598
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,64,1536,0.004375111311674118
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,64,3072,0.023670223024156358
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,64,1024,0.0038533334930737815
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,64,2560,0.021241777473025854
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,768,128,256,0.023678221636348303
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,64,768,0.003469333259595765
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,64,1536,0.01626844373014238
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,64,512,0.003456888927353753
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,64,1024,0.01457155578666263
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,64,256,0.00282222218811512
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,64,768,0.013439111411571503
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,64,128,0.0028604444944196274
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,64,512,0.012404444317022959
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,64,256,0.012069332930776807
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,64,64,0.00254133323000537
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,64,32,0.002536000063021978
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,64,128,0.011738667057620155
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,32,65536,0.019166222876972623
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,64,64,0.011703111231327057
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,64,32,0.011083555718262991
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,32,51200,0.012714666624863943
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,32,16384,0.014145778285132514
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,32,16384,0.09511911206775242
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,32,65536,0.398601770401001
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,64,6144,0.03714488943417867
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,32,51200,0.31410490141974556
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,32,10240,0.008617777791288164
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,32,8192,0.008454221818182204
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,64,3584,0.02608000073168013
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,32,7168,0.007948444121413762
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,32,6144,0.007611555357774098
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,32,12288,0.07212533553441365
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,32,10240,0.06082666582531399
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,32,8192,0.04797777864668104
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,32,5120,0.007298666569921706
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,64,2048,0.018983110785484314
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,32,4096,0.007340444458855524
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,32,3584,0.007321777443091075
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,32,7168,0.0432293348842197
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,32,3072,0.0069431112044387394
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,32,6144,0.03713511096106635
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,32,2560,0.00692622239391009
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,32,5120,0.03252799974547492
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,32,2048,0.005209777918126848
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,32,1536,0.004575110971927643
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,32,3584,0.02628533376587762
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,32,3072,0.023430221610599097
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,32,1024,0.0039013334446483185
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,32,2560,0.021313778228229944
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,32,768,0.0035537779331207275
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,32,2048,0.019156444403860304
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,32,512,0.0032302221904198327
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,32,1536,0.0162426663769616
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,32,1024,0.01443822185198466
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,32,768,0.013389333254761167
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,32,128,0.0028400001012616684
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,32,512,0.012410666379663678
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,32,64,0.0028311111446883944
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,32,256,0.011723555624485016
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,32,128,0.011706666813956367
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,32,64,0.011360000405046674
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,32,32,0.011074666347768573
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,32,12288,0.009663999908500248
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,768,32,4096,0.02787644333309597
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,65536,16384,0.7317137718200684
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,32,256,0.0028373334142896864
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,65536,16384,0.7985715336269803
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,768,32,32,0.002642666714058982
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,65536,12288,0.5034631093343099
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,65536,10240,0.48192442788018125
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,65536,8192,0.40270222557915586
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,65536,12288,0.6652755737304688
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,65536,10240,0.48775021235148114
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,65536,8192,0.40049155553181964
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,65536,6144,0.26768000920613605
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,65536,7168,0.3831537829505072
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,65536,5120,0.21580178207821318
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,65536,6144,0.2984631061553955
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,65536,51200,2.4039279090033636
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,65536,4096,0.19417156113518608
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,65536,3584,0.15317511558532715
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,65536,5120,0.2801671028137207
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,65536,4096,0.21062400605943468
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,65536,3072,0.1396604379018148
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,65536,2560,0.11531644397311741
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,65536,2048,0.09078577491972183
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,65536,51200,2.7375982072618275
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,65536,1536,0.0753484434551663
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,65536,1024,0.055252446068657764
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,65536,2048,0.11529955599043105
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,65536,3584,0.18587288591596815
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,65536,3072,0.154968884256151
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,65536,768,0.043565332889556885
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,65536,1536,0.08964533276028103
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,65536,512,0.03149155444569058
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,65536,1024,0.07086488935682508
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,65536,7168,0.3166337807973226
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,65536,128,0.021381333470344543
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,65536,768,0.058555556668175586
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,65536,512,0.051009777519438
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,65536,64,0.01757422255145179
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,65536,256,0.04589510957400004
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,65536,32,0.018223999275101554
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,65536,64,0.04223111271858215
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,65536,32,0.04144622219933404
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,51200,16384,0.5287466579013401
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,65536,2560,0.13524799876742893
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,65536,256,0.02334755493534936
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,65536,128,0.044032000833087497
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,51200,12288,0.4090880023108588
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,51200,16384,0.6384551260206435
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,51200,51200,1.8795706431070964
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,51200,10240,0.3394062254163954
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,51200,12288,0.4686364597744412
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,51200,10240,0.3899075455135769
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,51200,8192,0.32051555315653485
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,51200,7168,0.25300267007615834
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,51200,51200,2.136384963989258
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,51200,65536,2.4318169487847223
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,51200,8192,0.32548620965745717
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,51200,7168,0.27454400062561035
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,51200,6144,0.2669351100921631
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,51200,5120,0.17167199982537162
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,51200,4096,0.14379378159840903
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,51200,65536,2.6762604183620877
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,51200,3072,0.11078044441011216
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,51200,3584,0.14488089084625244
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,51200,3584,0.1361644400490655
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,51200,5120,0.22105244795481363
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,51200,4096,0.16372444894578722
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,51200,2048,0.08696177932951187
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,51200,1536,0.06797333558400472
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,51200,1024,0.05107466710938347
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,51200,2560,0.09399288892745972
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,51200,2048,0.09199111329184638
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,51200,768,0.0354053344991472
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,51200,1536,0.07452799876530965
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,51200,512,0.027310222387313843
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,51200,2560,0.1101564433839586
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,51200,1024,0.05786044730080498
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,51200,256,0.020460445019933913
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,51200,768,0.04873155554135641
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,51200,128,0.016514667206340365
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,51200,64,0.014799111419253878
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,51200,512,0.04191999965243869
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,51200,256,0.036658667855792575
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,51200,32,0.015127999915017022
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,51200,128,0.03490755624241299
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,51200,64,0.034613334470325045
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,51200,6144,0.23908265431722006
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,51200,32,0.03440444336997138
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,16384,16384,0.18592800034417045
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,16384,16384,0.24087201224433052
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,16384,12288,0.1315457820892334
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,51200,3072,0.1258266634411282
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,16384,51200,0.5487964418199327
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,16384,65536,0.7277333471510145
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,16384,8192,0.10217689143286811
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,16384,12288,0.18157511287265352
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,16384,10240,0.15245955520206028
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,16384,51200,0.7963884671529134
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,16384,7168,0.0909644431538052
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,16384,6144,0.07570577992333306
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,16384,5120,0.06752444638146295
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,16384,65536,0.9877893659803602
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,16384,4096,0.056052446365356445
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,16384,6144,0.09787022405200535
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,16384,3584,0.050048887729644775
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,16384,4096,0.06889600223965116
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,16384,3072,0.04269422094027201
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,16384,2560,0.03655111127429538
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,16384,3584,0.0624177787039015
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,16384,5120,0.08376889096366034
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,16384,2048,0.02940888868437873
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,16384,3072,0.05564177698559231
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,16384,1536,0.02346222268210517
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,16384,2560,0.04948355423079597
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,16384,1024,0.017311111092567444
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,16384,2048,0.040935112370385066
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,16384,768,0.014849777022997538
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,16384,512,0.012176888684431711
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,16384,1536,0.033278223541047834
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,16384,256,0.009003555609120263
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,16384,768,0.024335111180941265
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,16384,128,0.007318221860461765
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,16384,512,0.021520000365045335
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,16384,64,0.006870222174459034
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,16384,32,0.006573333508438534
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,16384,10240,0.11987466282314724
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,16384,128,0.018923555811246235
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,16384,64,0.01889866590499878
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,16384,32,0.018890667292806838
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,16384,8192,0.1342737807167901
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,12288,65536,0.4575786590576172
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,12288,51200,0.38297687636481387
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,12288,12288,0.09470933013492161
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,12288,51200,0.6350480185614692
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,12288,65536,0.8021333482530383
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,12288,12288,0.16223288906945124
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,12288,10240,0.08047911193635729
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,16384,1024,0.027851555082533095
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,12288,8192,0.07423288954628839
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,12288,7168,0.05946755409240723
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,12288,10240,0.1258257759941949
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,16384,256,0.01979555520746443
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,12288,8192,0.10294222169452244
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,12288,5120,0.04826400015089247
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,12288,7168,0.09322133329179551
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,12288,4096,0.03863733344607883
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,12288,6144,0.08006578021579318
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,12288,3584,0.032855110036002264
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,16384,7168,0.1114506721496582
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,12288,3072,0.029956443442238703
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,12288,4096,0.05771644247902764
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,12288,2560,0.025794666674402025
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,12288,16384,0.12195821603139241
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,12288,3584,0.050669332345326744
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,12288,2048,0.02174577779240078
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,12288,1536,0.017083555459976196
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,12288,3072,0.045498665836122304
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,12288,1024,0.013062222136391534
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,12288,2560,0.04117155406210158
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,12288,2048,0.03492088781462775
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,12288,768,0.011005333728260465
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,12288,512,0.008763555851247575
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,12288,1536,0.028927998410330877
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,12288,1024,0.023715555667877197
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,12288,768,0.021252445048756067
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,12288,512,0.018951111369662814
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,12288,256,0.017529777354664274
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,12288,64,0.005233777893914117
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,12288,128,0.01718755563100179
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,12288,32,0.0052355556852287715
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,12288,6144,0.05260799990759956
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,12288,64,0.016892444756295946
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,12288,32,0.016851555969980028
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,12288,5120,0.07043288813696967
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,10240,65536,0.5183164278666178
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,10240,51200,0.4070524374643962
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,10240,16384,0.13301422860887316
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,10240,65536,0.7192933294508191
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,12288,256,0.006615110983451207
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,10240,12288,0.10602044396930271
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,12288,16384,0.21572444174024794
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,10240,16384,0.17619289292229545
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,12288,128,0.005610666755172942
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,10240,51200,0.5617306497361925
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,10240,10240,0.08742222521040176
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,10240,8192,0.07137066788143583
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,10240,7168,0.06251377529568143
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,10240,12288,0.1329537762535943
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,10240,6144,0.05386755532688565
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,10240,5120,0.04609955681694878
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,10240,8192,0.09308089150322808
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,10240,7168,0.08182933595445421
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,10240,10240,0.11635733975304498
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,10240,3584,0.033858666817347206
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,10240,6144,0.07199022505018446
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,10240,5120,0.061816891034444175
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,10240,2560,0.02478133307562934
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,10240,4096,0.05072177780999077
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,10240,2048,0.0203484445810318
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,10240,3584,0.045738667249679565
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,10240,3072,0.04122311207983229
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,10240,1536,0.016757332616382174
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,10240,1024,0.01275199982855055
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,10240,2560,0.03700088792377048
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,10240,768,0.011034666664070554
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,10240,2048,0.030870222383075293
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,10240,512,0.008560889297061497
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,10240,1536,0.026759111218982275
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,10240,256,0.006963555183675554
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,10240,1024,0.022011554903454248
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,10240,768,0.019903111788961623
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,10240,128,0.005574222240183089
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,10240,64,0.005202666752868229
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,10240,512,0.017849778135617573
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,10240,32,0.005223999834722943
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,10240,256,0.016904888881577384
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,10240,128,0.016184000505341422
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,10240,64,0.015915556086434256
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,10240,32,0.01581333412064446
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,8192,16384,0.09351466761695014
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,8192,12288,0.0760400030348036
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,8192,65536,0.37607110871209043
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,8192,16384,0.15091821882459852
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,8192,10240,0.06542222367392646
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,10240,4096,0.03812177644835578
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,8192,12288,0.11629599995083278
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,8192,51200,0.48769246207343203
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,8192,8192,0.05397866831885444
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,8192,7168,0.045808888143963285
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,8192,10240,0.09871021906534831
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,10240,3072,0.02996622191535102
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,8192,5120,0.03379644287957086
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,8192,8192,0.08182666699091594
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,8192,7168,0.07209955321417914
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,8192,4096,0.027969777584075928
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,8192,6144,0.06382666693793403
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,8192,3584,0.024697777297761705
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,8192,5120,0.054153776831097074
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,8192,3072,0.021963554951879714
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,8192,2560,0.018799111247062683
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,8192,2048,0.016136889656384785
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,8192,4096,0.044590221510993115
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,8192,3584,0.040793776512145996
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,8192,3072,0.03678399986690945
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,8192,2560,0.033245331711239286
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,8192,1024,0.010645333263609143
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,8192,2048,0.02781955401102702
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,8192,768,0.009313777916961247
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,8192,1536,0.024401777320437964
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,8192,512,0.007280000381999546
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,8192,1024,0.019852444529533386
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,8192,256,0.005893333504597346
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,8192,768,0.018195556269751657
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,8192,128,0.0052151112920708126
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,8192,512,0.016640888320075143
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,8192,51200,0.2704186704423693
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,8192,64,0.004537777768241035
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,8192,256,0.016009777784347534
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,8192,32,0.004869333157936732
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,8192,128,0.015458666616015963
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,8192,32,0.01515111161602868
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,8192,64,0.015473778049151102
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,8192,65536,0.6154470973544651
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,8192,6144,0.04091822107632955
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,7168,65536,0.33870845370822483
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,7168,16384,0.08577511045667861
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,7168,51200,0.26347290145026314
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,7168,12288,0.063664886686537
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,7168,16384,0.14131822850969103
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,7168,10240,0.058028446303473584
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,7168,8192,0.044497778018315635
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,7168,12288,0.10774755477905273
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,8192,1536,0.013422222601042854
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,7168,7168,0.03854399919509888
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,7168,51200,0.4502408769395616
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,7168,65536,0.5733333163791233
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,7168,10240,0.09192799859576756
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,7168,6144,0.03320622113015916
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,7168,8192,0.076200889216529
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,7168,5120,0.028703110085593328
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,7168,4096,0.02681866619322035
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,7168,3584,0.022456000248591106
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,7168,3072,0.01993955506218804
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,7168,6144,0.06334311432308622
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,7168,5120,0.05013688736491733
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,7168,4096,0.04180533356136746
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,7168,2048,0.014831110835075378
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,7168,3584,0.03828444414668613
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,7168,3072,0.0348053342766232
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,7168,1536,0.012331555287043253
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,7168,1024,0.009995555712117089
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,7168,2560,0.03262133399645487
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,7168,2048,0.026520000563727483
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,7168,768,0.008469333251317343
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,7168,1536,0.02270577847957611
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,7168,1024,0.018923555811246235
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,7168,256,0.005507555686765247
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,7168,768,0.018201778332392376
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,7168,128,0.004546666724814309
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,7168,512,0.016150222884284127
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,7168,64,0.0041928887367248535
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,7168,256,0.015489778584904142
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,7168,32,0.004552000098758274
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,7168,128,0.015448888142903646
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,7168,64,0.014779556128713818
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,7168,32,0.014484445254007975
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,6144,65536,0.24199199676513672
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,6144,51200,0.22669778929816353
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,6144,16384,0.06878755489985149
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,6144,12288,0.04724444283379448
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,6144,16384,0.12986132833692762
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,6144,65536,0.5288044611612955
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,6144,51200,0.41376622517903644
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,7168,2560,0.017808000246683758
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,7168,7168,0.06753510899013944
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,6144,8192,0.03580977850490146
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,6144,12288,0.0995360016822815
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,6144,7168,0.028949333561791316
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,6144,6144,0.027495111028353374
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,6144,5120,0.02289155622323354
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,6144,10240,0.08535289102130467
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,6144,8192,0.07039378086725871
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,6144,7168,0.061271111170450844
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,6144,4096,0.018794667389657762
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,6144,3584,0.01698933376206292
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,7168,512,0.006697777658700943
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,6144,3072,0.015336889359686108
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,6144,5120,0.04645244280497233
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,6144,2560,0.013430222041077085
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,6144,4096,0.03889866669972738
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,6144,2048,0.011718221836619906
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,6144,1536,0.009979555176364051
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,6144,3072,0.032650666104422674
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,6144,1024,0.008294222255547842
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,6144,2560,0.02975911233160231
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,6144,2048,0.024923556380801733
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,6144,1536,0.02142222225666046
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,6144,512,0.005560889012283749
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,6144,1024,0.017895999881956313
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,6144,256,0.004591111093759537
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,6144,768,0.01683644453684489
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,6144,128,0.004242666479614046
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,6144,512,0.015512888630231222
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,6144,256,0.015173332558737861
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,6144,64,0.003850666599141227
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,6144,128,0.014448889427714877
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,6144,32,0.0038853333228164246
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,6144,64,0.01443911095460256
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,6144,10240,0.047192888127432935
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,6144,32,0.014089778065681458
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,5120,65536,0.2605822351243761
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,6144,6144,0.05434222353829277
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,6144,3584,0.03610666592915853
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,5120,16384,0.06894844770431519
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,5120,65536,0.4806506898668077
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,5120,12288,0.05444622370931837
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,6144,768,0.006637333167923822
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,5120,10240,0.04647022154596117
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,5120,16384,0.1180773311191135
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,5120,8192,0.03771555423736572
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,5120,51200,0.38047112358940977
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,5120,12288,0.09120444456736247
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,5120,7168,0.033955554167429604
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,5120,10240,0.07864177889294095
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,5120,6144,0.0291955570379893
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,5120,5120,0.024746666351954143
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,5120,8192,0.06451911396450467
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,5120,4096,0.019924443629052904
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,5120,7168,0.056458665264977344
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,5120,3584,0.018403554956118267
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,5120,6144,0.04987466666433546
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,5120,5120,0.04331022169854906
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,5120,4096,0.03641600079006619
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,5120,2560,0.014019555515713163
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,5120,2048,0.012335110869672565
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,5120,3072,0.03042666779624091
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,5120,1536,0.01036444471942054
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,5120,1024,0.008473777936564552
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,5120,2560,0.028115553988350764
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,5120,768,0.006937777830494775
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,5120,2048,0.023215999205907185
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,5120,512,0.00555377784702513
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,5120,1536,0.020255110330051847
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,5120,1024,0.01715377800994449
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,5120,256,0.004984000076850255
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,5120,128,0.004522666749027041
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,5120,512,0.0151582227812873
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,5120,51200,0.21321954992082384
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,5120,64,0.004182222402758068
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,5120,256,0.014476444986131458
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,5120,32,0.003859555555714501
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,5120,128,0.013824000126785703
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,5120,64,0.013808888693650564
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,5120,32,0.013740444348918067
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,4096,65536,0.2067955599890815
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,4096,51200,0.17545066939459908
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,4096,65536,0.432785775926378
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,4096,51200,0.340939548280504
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,4096,16384,0.10682400067647298
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,5120,3072,0.016145777371194627
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,4096,12288,0.04595288965437147
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,4096,10240,0.03798222210672166
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,4096,8192,0.0314337776766883
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,5120,3584,0.03360711203681098
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,4096,7168,0.027667555544111464
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,4096,12288,0.08300355407926771
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,4096,6144,0.023853333459960088
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,4096,10240,0.07102044423421223
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,4096,5120,0.020302222834693063
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,4096,8192,0.05828622314665052
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,4096,4096,0.017051556044154696
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,4096,7168,0.051184889343049794
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,4096,3584,0.01575555569595761
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,4096,6144,0.044808000326156616
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,4096,3072,0.014121777481502958
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,5120,768,0.016162667009565566
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,4096,2560,0.012335110869672565
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,4096,4096,0.0336097776889801
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,4096,2048,0.010586666564146677
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,4096,1536,0.008961777720186446
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,4096,3072,0.028446220689349707
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,4096,2560,0.02606755495071411
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,4096,1024,0.006963555183675554
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,4096,2048,0.02130222154988183
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,4096,768,0.006220444622966979
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,4096,1536,0.018933332628673978
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,4096,512,0.005201777650250329
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,4096,256,0.004566222015354368
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,4096,1024,0.01648355523745219
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,4096,768,0.015248888068728976
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,4096,128,0.004553777890072929
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,4096,512,0.01444533301724328
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,4096,16384,0.057766218980153404
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,4096,256,0.014078223043017916
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,4096,32,0.0036106668412685394
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,4096,128,0.013414222333166333
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,4096,64,0.013415111435784234
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,4096,32,0.013096888860066732
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,3584,65536,0.17700800630781385
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,3584,51200,0.16262400150299072
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,3584,16384,0.04920088913705614
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,3584,12288,0.03804088963402642
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,3584,65536,0.41672266854180234
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,3584,16384,0.10516711076100667
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,3584,51200,0.3299173249138726
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,3584,10240,0.03377244538731045
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,3584,12288,0.08177510897318523
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,4096,5120,0.039573334985309176
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,3584,8192,0.02734755476315816
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,3584,7168,0.023073777556419373
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,4096,3584,0.031152000029881794
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,3584,10240,0.06964088810814752
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,3584,8192,0.057258665561676025
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,3584,7168,0.050663110282686025
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,3584,4096,0.015962666935390897
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,3584,6144,0.0444124440352122
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,3584,5120,0.038889778984917536
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,3584,3072,0.01309333327743742
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,3584,4096,0.0333315564526452
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,4096,64,0.003504000190231535
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,3584,2560,0.011702222128709158
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,3584,2048,0.009977777798970541
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,3584,3584,0.030478222502602473
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,3584,1536,0.008253333469231924
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,3584,3072,0.027632888820436265
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,3584,2560,0.02553155521551768
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,3584,1024,0.006704000135262807
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,3584,2048,0.021176000436147053
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,3584,768,0.005913777897755305
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,3584,1536,0.018583999739752877
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,3584,1024,0.016233777006467182
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,3584,256,0.004211555752489301
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,3584,768,0.015132443772421943
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,3584,128,0.003855111284388436
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,3584,512,0.014468444718254937
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,3584,64,0.0032595555401510666
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,3584,256,0.013775111072593264
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,3584,128,0.013119999733236102
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,3584,64,0.013075555364290873
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,3584,6144,0.020563556088341605
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,3584,32,0.013099555340078143
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,3584,5120,0.018212444252438016
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,3072,65536,0.16444355911678737
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,3072,16384,0.045385777950286865
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,3072,51200,0.14609777927398682
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,3584,3584,0.014256000518798828
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,3072,12288,0.0354693333307902
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,3072,10240,0.030216889248953924
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,3072,51200,0.30339378780788845
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,3072,65536,0.3829795519510905
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,3072,12288,0.0744382209248013
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,3072,8192,0.02456355591615041
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,3072,7168,0.0214008887608846
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,3072,6144,0.01901955571439531
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,3072,8192,0.05160444312625461
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,3584,512,0.00488711107108328
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,3072,7168,0.04538044333457947
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,3072,5120,0.016564443707466125
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,3072,4096,0.013944000005722046
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,3072,3584,0.012809777425395118
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,3072,6144,0.04069955481423272
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,3072,3072,0.011494222614500256
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,3072,5120,0.0358897778722975
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,3072,4096,0.030656887425316706
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,3072,2560,0.010286221901575724
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,3072,3584,0.028524445162879095
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,3072,2048,0.008967111508051554
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,3072,1536,0.007600888609886169
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,3072,3072,0.025813332862324182
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,3584,32,0.003536000019974179
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,3072,1024,0.005888888819350137
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,3072,2560,0.022882666852739122
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,3072,768,0.005542222410440445
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,3072,2048,0.019539554913838703
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,3072,512,0.004865777575307422
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,3072,1536,0.01752711170249515
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,3072,256,0.0038986665507157645
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,3072,1024,0.015480889214409722
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,3072,128,0.0038533334930737815
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,3072,768,0.01479022204875946
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,3072,64,0.003478222423129611
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,3072,512,0.014132445057233175
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,3072,32,0.003481777591837777
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,3072,256,0.013433777623706393
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,3072,128,0.01308444473478529
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,3072,64,0.012805333567990197
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,3072,32,0.012720000412729053
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,2560,65536,0.16203822029961482
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,2560,51200,0.1296008825302124
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,3072,16384,0.09553422530492146
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,2560,16384,0.04660177893108792
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,2560,12288,0.03521600034501817
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,2560,10240,0.029934220843844946
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,3072,10240,0.06309866905212402
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,2560,8192,0.024824000067181055
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,2560,16384,0.0942408906088935
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,2560,51200,0.29717334111531574
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,2560,65536,0.37575199868943954
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,2560,12288,0.07310933536953397
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,2560,10240,0.061944888697730176
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,2560,6144,0.019132445255915325
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,2560,5120,0.01664977769056956
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,2560,4096,0.014210666219393412
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,2560,8192,0.0502106679810418
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,2560,7168,0.04514044523239136
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,2560,3584,0.013334222137928009
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,2560,6144,0.03971022367477417
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,2560,3072,0.01220266686545478
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,2560,5120,0.035571555296579994
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,2560,4096,0.030135111676322088
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,2560,2560,0.010616000327799054
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,2560,2048,0.00902133352226681
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,2560,3584,0.027896000279320612
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,2560,3072,0.024567999773555334
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,2560,2560,0.02274311085542043
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,2560,1024,0.005903111149867375
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,2560,768,0.005320888840489917
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,2560,1536,0.017469333277808297
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,2560,512,0.004576000074545543
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,2560,768,0.01444533301724328
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,2560,256,0.0038951109680864546
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,2560,512,0.014099554883109199
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,2560,128,0.003546666767862108
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,2560,256,0.013136000268989138
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,2560,64,0.0032426667296224167
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,2560,128,0.012798222402731577
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,2560,32,0.0032684444967243406
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,2560,7168,0.02242044442229801
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,2560,64,0.01239999963177575
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,2560,32,0.012473777764373355
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,2048,51200,0.1303724447886149
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,2048,65536,0.1631759934955173
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,2048,16384,0.04513422316975064
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,2048,12288,0.032305777072906494
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,2560,1536,0.007298666569921706
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,2048,16384,0.08403288655810887
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,2048,51200,0.26753687858581543
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,2048,10240,0.028485334581798975
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,2560,2048,0.0192266669538286
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,2048,8192,0.02381155557102627
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,2048,12288,0.06491377618577746
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,2048,7168,0.020592888196309406
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,2048,6144,0.01923022170861562
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,2048,10240,0.05491288834147983
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,2560,1024,0.015499555402331881
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,2048,5120,0.0158933334880405
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,2048,8192,0.044885334041383534
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,2048,4096,0.013398222625255585
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,2048,3584,0.011745777395036487
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,2048,6144,0.03658933440844218
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,2048,3072,0.010683555569913654
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,2048,2560,0.009357333183288574
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,2048,4096,0.02701688806215922
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,2048,3584,0.024745777249336243
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,2048,2048,0.008143111235565608
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,2048,3072,0.022646221849653456
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,2048,1536,0.006981333096822103
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,2048,2560,0.020679111282030743
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,2048,2048,0.018223111828168232
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,2048,768,0.00489777781897121
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,2048,1536,0.01648977730009291
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,2048,1024,0.014494222071435718
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,2048,512,0.004237333519591225
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,2048,256,0.0038480001191298165
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,2048,768,0.01407911048995124
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,2048,128,0.0031866667171319327
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,2048,512,0.013407111167907715
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,2048,64,0.0032195556494924757
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,2048,256,0.012835555606418185
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,2048,32,0.0032239999208185407
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,2048,128,0.01276711126168569
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,2048,64,0.012101333174440594
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,2048,65536,0.335843563079834
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,2048,32,0.012168889244397482
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,1536,65536,0.09892888863881429
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,1536,16384,0.03158400124973721
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,2048,7168,0.04070666763517592
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,1536,16384,0.08261155419879489
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,1536,12288,0.025609778033362493
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,1536,65536,0.33056889639960396
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,2048,5120,0.032495998673968844
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,1536,10240,0.02181422213713328
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,1536,8192,0.01865600049495697
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,1536,7168,0.01684799955950843
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,2048,1024,0.005910222315125995
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,1536,12288,0.06368088722229004
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,1536,10240,0.053118222289615206
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,1536,8192,0.04418311185306973
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,1536,6144,0.014767999450365702
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,1536,5120,0.013334222137928009
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,1536,4096,0.011967110964987012
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,1536,7168,0.03995111253526475
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,1536,3584,0.0107351111041175
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,1536,6144,0.03583022289805942
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,1536,3072,0.009669333696365356
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,1536,5120,0.0317795541551378
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,1536,2560,0.00830666638082928
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,1536,4096,0.026160889201694067
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,1536,2048,0.007610666255156199
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,1536,3584,0.024999999337726172
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,1536,1536,0.006256888724035687
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,1536,3072,0.02267644471592373
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,1536,1024,0.005224888937340842
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,1536,2560,0.020595555504163105
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,1536,2048,0.017852443787786696
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,1536,768,0.00453955555955569
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,1536,1536,0.01625333395269182
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,1536,512,0.0038746665749284956
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,1536,1024,0.01423111061255137
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,1536,768,0.013797333670987023
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,1536,512,0.013394667042626275
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,1536,128,0.0034871109657817413
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,1536,64,0.003140444349911478
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,1536,51200,0.08177333407931857
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,1536,32,0.003228444399105178
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,1536,128,0.012314666476514606
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,1536,64,0.01202933324707879
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,1536,51200,0.26094399558173287
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,1024,65536,0.06427288717693753
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,1024,51200,0.05210666524039375
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,1024,16384,0.02165511084927453
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,1024,65536,0.2884391148885091
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,1024,51200,0.22779199812147352
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,1024,12288,0.018358222312397428
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,1024,10240,0.01908533275127411
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,1024,8192,0.015459555718633862
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,1024,12288,0.055101331737306386
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,1024,10240,0.04634844594531589
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,1024,7168,0.015452444553375244
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,1024,6144,0.013711111413107978
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,1024,8192,0.03900266687075297
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,1024,5120,0.010827555424637265
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,1536,256,0.0035084444615576
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,1024,7168,0.0351493325498369
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,1024,4096,0.009348444640636444
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,1024,6144,0.031535999642478094
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,1024,3584,0.00868000007337994
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,1024,5120,0.027570666538344488
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,1536,256,0.012735111018021902
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,1024,4096,0.02366666661368476
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,1024,2560,0.007326222128338284
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,1024,3584,0.02234399980968899
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,1024,2048,0.0064106666379504735
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,1024,1536,0.005598222215970357
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,1024,2560,0.018927110566033255
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,1024,2048,0.016509332590632968
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,1024,1024,0.004549333204825719
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,1024,768,0.0041893331540955436
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,1024,1536,0.015411555767059326
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,1024,512,0.003690666622585721
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,1024,1024,0.013778666655222574
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,1024,256,0.0034871109657817413
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,1024,768,0.013423999978436364
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,1024,128,0.002993777808215883
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,1024,512,0.012783110969596438
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,1024,64,0.0028275555620590844
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,1024,16384,0.07190666596094768
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,1024,256,0.012379555238617791
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,1024,32,0.003169777699642711
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,1024,128,0.01204533295498954
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,768,65536,0.051538666089375816
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,1024,64,0.011723555624485016
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,768,51200,0.04215022259288364
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,1024,32,0.011744000017642975
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,768,16384,0.018233777748213876
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,768,12288,0.015771556231710646
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,768,16384,0.07090489069620769
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,768,65536,0.28636267450120717
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,768,51200,0.22559467951456705
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,768,10240,0.014296889305114746
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,768,12288,0.05396711164050632
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,1024,3072,0.00792266676823298
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,768,8192,0.015844444433848064
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,768,7168,0.014783999986118741
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,768,6144,0.011169777976142036
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,768,5120,0.010344888601038191
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,768,10240,0.045957333511776395
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,768,8192,0.03763822383350796
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,1024,3072,0.02029333346419864
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,768,7168,0.03435466686884562
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,768,6144,0.03033155534002516
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,768,3584,0.00794488853878445
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,768,3072,0.007272000114123027
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,1536,32,0.012048000262843238
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,768,5120,0.027122666438420612
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,768,2560,0.006583111153708563
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,768,4096,0.023306666149033442
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,768,2048,0.006304889089531369
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,768,1536,0.0052151112920708126
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,768,3584,0.021899556120236714
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,768,3072,0.019952888290087383
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,768,1024,0.004556444370084339
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,768,768,0.0041999999019834726
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,768,2560,0.01889333294497596
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,768,1536,0.0151235560576121
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,768,1024,0.013643555343151093
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,768,256,0.003173333282272021
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,768,128,0.003165333428316646
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,768,512,0.012772444221708508
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,768,64,0.0028311111446883944
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,768,256,0.012130666938092975
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,768,32,0.0028719999310043124
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,768,64,0.011723555624485016
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,768,32,0.011722666521867117
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,512,65536,0.03821600145763821
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,768,4096,0.008340444829728868
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,512,65536,0.2854062186347114
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,512,51200,0.031670222679773964
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,512,16384,0.014582221706708273
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,768,2048,0.016494222813182406
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,512,16384,0.06988800234264798
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,512,12288,0.014492443866199918
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,768,768,0.013075555364290873
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,512,10240,0.013125333521101209
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,512,8192,0.013799111048380533
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,512,12288,0.05312622255749173
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,512,10240,0.04440444376733568
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,768,128,0.011726222104496427
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,512,8192,0.03728977839152018
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,512,5120,0.008991111483838823
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,512,7168,0.03348088926739163
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,512,4096,0.007981333467695449
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,512,6144,0.029969778325822618
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,512,3584,0.007305777735180325
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,512,5120,0.027101332942644756
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,512,3072,0.006603555546866522
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,512,4096,0.023053333163261414
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,512,2560,0.00620888877246115
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,512,3584,0.021958221991856892
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,512,2048,0.005385777602593104
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,512,3072,0.020038222273190815
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,512,1536,0.004903111192915174
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,512,2048,0.016197333733240765
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,512,1024,0.004187555362780889
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,512,1536,0.015145777000321282
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,512,768,0.003903999924659729
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,512,51200,0.22502401140001085
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,512,1024,0.013408888545301227
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,512,512,0.0035004446076022256
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,512,256,0.0032355555643637977
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,512,512,0.012720000412729053
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,512,128,0.0031679999083280563
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,512,256,0.012121777567598553
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,512,6144,0.010585777461528778
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,512,64,0.002879111096262932
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,512,32,0.002983999955985281
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,512,128,0.011502222054534487
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,256,65536,0.02569599946339925
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,512,32,0.011459555890825061
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,256,51200,0.023011555274327595
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,256,65536,0.2849484549628364
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,512,2560,0.01866755551762051
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,256,16384,0.012735111018021902
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,256,51200,0.22394310103522408
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,256,12288,0.011085333095656501
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,256,10240,0.010010666317409938
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,256,16384,0.06911910904778375
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,768,512,0.003543111185232798
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,256,12288,0.051860445075564914
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,256,8192,0.010392000277837118
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,256,7168,0.009673777553770278
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,256,10240,0.04396977689531115
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,256,6144,0.009020444419648912
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,512,768,0.013445333474212222
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,256,5120,0.008627555436558193
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,256,8192,0.036502222220102944
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,256,7168,0.032913777563307024
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,256,4096,0.007602666815121968
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,256,3584,0.007250666618347168
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,256,6144,0.029807110627492268
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,256,3072,0.006562666760550604
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,512,7168,0.011756444142924415
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,256,2560,0.005959110955397288
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,256,5120,0.026799110902680293
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,256,4096,0.022982221510675218
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,256,2048,0.0059262220230367445
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,256,3584,0.02160444524553087
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,256,1536,0.004543111142185
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,256,1024,0.0038924444880750445
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,256,3072,0.019902222686343722
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,256,768,0.003604444364706675
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,256,2560,0.018616000811258953
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,512,64,0.011545778148704104
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,256,2048,0.016172443826993305
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,256,1536,0.015100444356600443
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,256,256,0.003165333428316646
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,256,1024,0.013417777915795645
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,256,768,0.013061333033773633
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,256,64,0.002536000063021978
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,256,512,0.012448000411192576
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,256,32,0.0028239999794297745
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,256,256,0.012073777616024017
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,128,65536,0.019311111834314134
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,128,51200,0.017197334104114108
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,256,32,0.011773332953453064
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,128,16384,0.01203644441233741
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,128,65536,0.2836915651957194
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,128,51200,0.22369511922200522
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,128,12288,0.01012711144155926
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,128,16384,0.0684151119656033
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,128,10240,0.009688888986905416
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,128,8192,0.008651555412345463
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,128,12288,0.050789333052105375
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,128,10240,0.04407555527157254
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,128,7168,0.009356444080670675
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,128,6144,0.008991111483838823
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,128,7168,0.03288977675967746
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,128,5120,0.00796088907453749
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,128,6144,0.029510223203235205
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,128,4096,0.007823111282454597
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,256,512,0.0035457776652442086
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,128,3584,0.007252444823582967
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,256,128,0.002862222285734283
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,128,5120,0.026741334133678015
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,128,3072,0.00657155571712388
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,128,4096,0.023030221462249756
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,128,2560,0.0058906666106647914
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,256,128,0.011730666789743634
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,128,2048,0.0052435555391841466
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,128,3584,0.0214035560687383
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,128,1536,0.004556444370084339
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,128,3072,0.019910222954220243
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,128,1024,0.0038720000949170855
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,128,768,0.0038133333954546186
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,128,2048,0.01608711149957445
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,128,1536,0.015045333239767285
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,128,1024,0.013425778183672162
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,128,768,0.012806221842765808
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,128,256,0.0031715554909573663
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,128,128,0.002805333377586471
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,128,512,0.012450666891203986
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,128,64,0.002809777855873108
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,128,256,0.01203555530971951
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,128,128,0.011346666349305047
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,128,64,0.011679111255539788
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,128,8192,0.03595911131964789
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,128,32,0.011399110986126794
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,64,51200,0.014120888378885059
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,64,65536,0.2842462327745226
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,64,51200,0.22322132852342394
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,64,16384,0.009681777821646797
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,64,12288,0.012406222522258759
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,256,64,0.01165066659450531
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,64,16384,0.06879378027386136
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,128,2560,0.018583110637134977
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,64,12288,0.05105244451098972
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,64,8192,0.009706666900051964
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,128,512,0.0035048888789282907
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,64,7168,0.009199110998047723
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,64,6144,0.00868000007337994
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,64,10240,0.042803555727005005
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,64,8192,0.035635554128222995
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,64,5120,0.008095111283991072
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,64,4096,0.007345777418878343
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,64,6144,0.029263112280103896
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,128,32,0.0028648889727062653
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,64,3584,0.006976889239417181
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,64,5120,0.02647200061215295
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,64,3072,0.0063164445261160536
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,64,2560,0.005616888817813661
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,64,65536,0.016519111063745286
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,64,3584,0.021290666527218286
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,64,2048,0.005170666509204441
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,64,1536,0.0042071110672420925
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,64,3072,0.019751111666361492
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,64,1024,0.0038293335172865125
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,64,2560,0.018266666266653273
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,64,2048,0.016140444411171805
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,64,768,0.0034977777136696708
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,64,512,0.003170666595300039
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,64,1536,0.014889778362380134
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,64,256,0.002858666703104973
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,64,768,0.01309511148267322
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,64,128,0.0026666666898462507
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,64,64,0.002500444443689452
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,64,256,0.011759999725553723
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,64,32,0.002534222271707323
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,64,128,0.01182755579551061
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,64,10240,0.011075555450386472
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,64,64,0.011074666347768573
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,32,65536,0.03621244430541992
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,64,32,0.011405333048767514
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,32,51200,0.028809779220157202
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,32,16384,0.010406222608354356
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,32,12288,0.020939555433061387
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,32,16384,0.06804711288876004
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,64,7168,0.03272711237271627
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,32,65536,0.28416445520189076
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,32,51200,0.2233511077033149
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,32,10240,0.017847999930381775
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,32,12288,0.050761779149373375
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,32,8192,0.015125332607163323
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,32,7168,0.014090667168299357
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,32,6144,0.012505778008037143
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,64,4096,0.023020444644822016
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,32,5120,0.01130311108297772
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,32,10240,0.04249599907133314
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,32,8192,0.03555555476082696
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,32,4096,0.008905777500735389
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,32,3584,0.008392888638708327
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,32,7168,0.03269066744380527
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,32,6144,0.029438220792346533
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,32,3072,0.0076044441925154785
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,32,2560,0.005656888915432825
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,32,5120,0.026425777210129633
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,32,4096,0.022981334063741896
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,32,2048,0.004917333523432414
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,32,3584,0.021720889541837905
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,32,3072,0.019659555620617337
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,32,1024,0.0038497779104444715
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,32,2560,0.018237334158685472
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,64,1024,0.013431111143694984
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,32,2048,0.015867556134859722
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,32,768,0.0035457776652442086
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,32,512,0.0032142222755485107
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,32,1536,0.01478488908873664
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,64,512,0.012109333442317115
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,32,256,0.003185777821474605
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,32,128,0.0028071111689011254
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,32,768,0.01309866706530253
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,32,64,0.0028106667515304354
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,32,512,0.012093333734406365
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,32,32,0.0028168888141711554
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,32,256,0.011738667057620155
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,32,128,0.011372444530328115
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,32,64,0.011735999749766456
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,32,32,0.011359111302428775
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,65536,16384,0.6352266735500759
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,513,32,1536,0.0042160000238153665
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,65536,16384,0.7076329125298394
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,513,32,1024,0.01313066648112403
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,65536,12288,0.46172089046902126
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,65536,12288,0.5265635384453667
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,65536,10240,0.3628222147623698
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,65536,51200,2.1514044867621527
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,65536,10240,0.43683822949727374
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,65536,8192,0.3267253239949544
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,65536,51200,2.383967081705729
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,65536,8192,0.3497137758466933
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,65536,7168,0.27686044904920787
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,65536,12288,0.4864071210225423
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,65536,7168,0.30746756659613717
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,65536,6144,0.26214755905999076
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,65536,16384,0.6431271235148112
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,65536,10240,0.40257599618699813
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,65536,6144,0.26885777049594456
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,65536,5120,0.22201777829064262
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,65536,7168,0.2915457884470622
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,65536,4096,0.15521866745418972
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,65536,5120,0.22842489348517525
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,65536,8192,0.3284817801581489
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,65536,3584,0.13255822658538818
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,65536,6144,0.2580213281843397
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,65536,3584,0.1623964442147149
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,65536,4096,0.18594043784671357
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,65536,5120,0.21629956033494738
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,65536,3072,0.126310216055976
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,65536,2560,0.11606489287482367
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,65536,4096,0.1806346707873874
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,65536,2048,0.09125066465801662
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,65536,2560,0.12373422251807319
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,65536,3584,0.1605279975467258
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,65536,1536,0.06083289119932386
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,65536,3072,0.142941329214308
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,65536,2048,0.10260533624225193
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,65536,2560,0.12425422668457031
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,65536,1536,0.08216533395979139
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,65536,1024,0.048904889159732394
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,65536,2048,0.10621955659654404
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,65536,768,0.03693688909212748
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,65536,512,0.02771111163828108
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,65536,1024,0.06504178047180176
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,65536,1536,0.08899466858969794
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,65536,1024,0.07254133621851604
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,65536,768,0.05401866634686788
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,65536,768,0.06436089012357923
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,65536,128,0.01937955617904663
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,65536,512,0.05564177698559231
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,65536,256,0.020058666666348774
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,65536,512,0.047763556241989136
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,65536,256,0.04657511247528923
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,65536,64,0.016565332810084026
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,65536,32,0.016680889659457736
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,65536,128,0.04143911268975999
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,65536,128,0.03962755534383986
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,65536,32,0.03813777698410882
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,65536,64,0.03837777839766608
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,65536,3072,0.14193333519829646
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,65536,256,0.0427724454138014
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,51200,16384,0.4615902370876736
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,51200,51200,1.6414871215820312
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,51200,65536,2.1628053453233504
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,65536,51200,2.206537882486979
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,51200,51200,1.8920124901665583
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,51200,16384,0.5854969024658203
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,51200,65536,2.3143378363715277
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,51200,12288,0.40860711203681094
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,51200,10240,0.29951466454399955
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,51200,12288,0.45330402586195206
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,51200,10240,0.35101866722106934
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,51200,8192,0.24303200509813097
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,51200,8192,0.2859235604604085
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,51200,7168,0.21498666869269478
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,51200,12288,0.38968533939785427
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,51200,7168,0.2487724357181125
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,51200,6144,0.18143910831875273
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,51200,8192,0.26807554562886554
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,51200,16384,0.5222213533189561
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,51200,5120,0.1724239985148112
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,51200,10240,0.329910225338406
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,51200,6144,0.21665510866377088
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,51200,5120,0.20219377676645914
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,51200,7168,0.2388311227162679
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,51200,6144,0.20796088377634683
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,51200,4096,0.15499288505978054
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,51200,3584,0.1285368866390652
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,51200,5120,0.17866133319007027
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,51200,3584,0.1326568921407064
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,51200,4096,0.14861867162916395
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,51200,3072,0.11685155497656928
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,51200,2560,0.09646933608584934
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,51200,3072,0.12087999449835883
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,51200,3584,0.13445511129167345
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,51200,2048,0.07513778077231513
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,51200,4096,0.123325334654914
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,51200,2560,0.10145866870880127
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,51200,1536,0.06211821900473701
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,51200,2560,0.10684888892703587
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,51200,2048,0.08406488762961493
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,51200,1024,0.04334400097529093
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,51200,2048,0.09046577745013767
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,51200,1536,0.06816533539030287
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,51200,1536,0.07804799742168851
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,51200,3072,0.11553155051337348
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,51200,768,0.030981332063674927
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,51200,1024,0.05454488926463657
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,51200,512,0.024263999528355066
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,51200,51200,1.7664462195502386
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,51200,1024,0.06269866890377469
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,51200,768,0.05612444215350681
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,51200,768,0.04519288738568624
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,51200,128,0.016546666622161865
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,51200,512,0.03932266765170627
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,51200,512,0.048466665877236255
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,51200,256,0.04165510998831855
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,51200,64,0.016003555721706815
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,51200,256,0.021820444199774
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,51200,128,0.03715199894375271
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,51200,32,0.01628177695804172
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,51200,64,0.0321395562754737
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,51200,256,0.03478399912516276
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,51200,128,0.03270488977432251
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,16384,51200,0.45499112870958114
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,16384,65536,0.6288302209642198
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,16384,16384,0.16821600331200492
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,16384,51200,0.7123973104688855
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,16384,65536,0.8944791158040365
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,51200,65536,2.2926372951931424
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,16384,12288,0.11486221684349908
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,16384,16384,0.22973865932888457
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,16384,10240,0.0963840021027459
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,16384,12288,0.16874844498104521
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,51200,32,0.031832890378104314
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,16384,8192,0.09084088934792413
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,16384,10240,0.14407377772861057
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,16384,7168,0.07016088565190633
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,16384,16384,0.24700445599026152
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,16384,8192,0.11486221684349908
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,16384,6144,0.07123733229107328
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,16384,10240,0.16131733523474798
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,16384,8192,0.1338977813720703
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,16384,12288,0.19368444548712838
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,16384,7168,0.1035626663102044
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,16384,5120,0.060673779911465116
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,16384,4096,0.04926133486959669
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,16384,6144,0.09059466918309529
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,16384,5120,0.07915466361575656
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,16384,6144,0.10712622271643744
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,16384,5120,0.0938897795147366
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,16384,4096,0.06370666954252455
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,16384,51200,0.7501689063178169
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,16384,4096,0.07993600103590223
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,16384,3072,0.038471112648646034
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,16384,2560,0.03195910983615451
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,16384,3584,0.058352887630462646
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,16384,3584,0.07367999686135186
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,16384,2048,0.0247653325398763
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,16384,3072,0.06748088863160875
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,16384,3072,0.05242222216394213
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,16384,2560,0.045848889483345874
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,16384,2560,0.061287111706203885
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,16384,1536,0.020774222082561918
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,16384,1024,0.01650044487582313
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,16384,2048,0.05288355549176534
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,16384,2048,0.0372995568646325
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,16384,65536,0.9707981745402018
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,16384,1536,0.04612177941534254
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,16384,768,0.012884444660610624
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,16384,512,0.009974222216341231
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,16384,1024,0.027684445182482403
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,16384,1024,0.039819555150138006
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,16384,768,0.03728888763321771
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,16384,256,0.007706666986147563
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,16384,512,0.03314933180809021
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,16384,512,0.020278222031063504
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,16384,128,0.006603555546866522
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,16384,256,0.0292231109407213
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,16384,256,0.018588445252842374
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,16384,64,0.005617777920431561
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,16384,128,0.018223111828168232
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,16384,7168,0.12141511175367568
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,16384,32,0.005944889038801193
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,16384,3584,0.044284443060557045
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,16384,64,0.017866666118303936
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,16384,32,0.017958222164048087
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,12288,65536,0.4580373234219021
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,12288,51200,0.3586408827039931
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,16384,1536,0.03182044294145372
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,12288,16384,0.13920711146460638
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,12288,65536,0.7347866694132487
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,16384,768,0.024724443753560383
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,12288,12288,0.10553955369525486
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,12288,16384,0.181877334912618
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,12288,51200,0.5875537660386827
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,12288,12288,0.1396053367190891
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,12288,10240,0.08561155531141494
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,12288,16384,0.20823110474480522
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,12288,10240,0.11851644515991211
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,12288,8192,0.08068622483147515
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,12288,12288,0.16137422455681696
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,12288,7168,0.07008888986375597
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,12288,10240,0.13861332999335393
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,12288,8192,0.09661155276828343
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,12288,8192,0.11610310607486302
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,12288,7168,0.08597777949439155
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,12288,7168,0.10484533177481757
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,12288,6144,0.07626133494906955
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,12288,5120,0.04722133278846741
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,12288,65536,0.8050462404886881
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,12288,51200,0.63263824250963
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,12288,4096,0.040292445156309344
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,12288,5120,0.06712088982264201
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,12288,5120,0.0822311109966702
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,16384,128,0.02644444505373637
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,12288,4096,0.05426488982306587
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,12288,4096,0.0712968905766805
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,12288,3072,0.03132889005872939
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,12288,3584,0.06510755750868055
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,12288,3584,0.04861422379811605
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,12288,2560,0.026130666335423786
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,12288,3072,0.04401333464516533
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,12288,3072,0.05985599756240845
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,12288,2048,0.021577777134047613
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,12288,2560,0.054755555258856885
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,12288,2560,0.0391244457827674
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,12288,2048,0.03231822119818793
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,12288,1536,0.01593777702914344
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,12288,2048,0.048285331990983754
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,12288,1024,0.013224889006879596
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,12288,768,0.011513777905040316
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,12288,1536,0.027843554814656574
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,12288,1536,0.041793776883019336
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,12288,1024,0.03549066517088149
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,12288,512,0.009678222239017487
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,12288,6144,0.060876442326439746
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,12288,256,0.007273777491516537
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,12288,768,0.020305777589480083
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,12288,768,0.03325422273741828
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,12288,512,0.03071555495262146
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,12288,512,0.018248889181349013
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,12288,256,0.02718222141265869
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,12288,6144,0.09395022524727716
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,12288,128,0.016872000363137987
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,12288,128,0.024860444996092055
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,12288,32,0.006239999913507038
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,12288,64,0.016523554921150208
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,12288,3584,0.036200000180138484
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,12288,32,0.016152888536453247
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,10240,65536,0.4044364558325873
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,10240,51200,0.32513777414957684
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,10240,65536,0.6496062278747559
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,12288,1024,0.023025777604844835
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,10240,16384,0.10845155848397149
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,12288,128,0.006575111299753189
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,10240,51200,0.5107315381368002
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,12288,256,0.01682844426896837
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,10240,16384,0.1627031167348226
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,10240,12288,0.08667466375562881
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,12288,64,0.006233777850866318
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,10240,10240,0.07821866538789538
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,10240,12288,0.12441155645582412
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,10240,8192,0.06320266591178046
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,10240,10240,0.10572977860768636
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,10240,7168,0.05321422219276428
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,10240,12288,0.15956532955169678
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,10240,8192,0.08637244171566433
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,10240,8192,0.11441511578030056
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,10240,6144,0.04735022121005588
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,10240,7168,0.07675288783179389
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,10240,7168,0.10407377613915338
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,10240,5120,0.03484088844723172
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,10240,6144,0.06851822137832642
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,10240,4096,0.032672888702816434
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,10240,6144,0.09286844730377197
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,10240,5120,0.058952000406053334
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,10240,51200,0.625016901228163
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,10240,5120,0.08187911245557997
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,10240,3584,0.028997331857681274
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,10240,4096,0.04821066723929512
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,10240,4096,0.06923111279805501
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,10240,3072,0.024831111232439678
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,10240,3584,0.04301066531075371
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,10240,2560,0.021420444051424663
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,10240,3072,0.05923910935719808
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,10240,3072,0.03930044505331252
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,10240,2048,0.01777777738041348
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,10240,2560,0.0350853337181939
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,10240,2560,0.05418489045566983
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,10240,1536,0.0136808885468377
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,10240,2048,0.029779556724760268
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,10240,16384,0.2050924433602227
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,10240,2048,0.04690222276581658
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,10240,1024,0.010671111444632212
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,10240,1536,0.04150399896833632
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,10240,1536,0.025482666161325242
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,10240,768,0.009337777892748514
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,10240,1024,0.021317332983016968
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,10240,1024,0.03642311029964023
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,10240,512,0.007251555720965068
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,10240,768,0.018942221999168396
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,10240,768,0.03195733494228787
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,10240,256,0.005955555372767978
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,10240,512,0.02883022361331516
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,10240,512,0.01716711123784383
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,10240,128,0.005567111074924469
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,10240,256,0.016159110599093966
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,10240,64,0.0052044445441828836
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,10240,65536,0.7987288898891873
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,10240,128,0.02511288887924618
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,10240,128,0.015838222371207345
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,10240,32,0.0052800000541739995
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,10240,64,0.015509333875444202
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,10240,32,0.015821332732836407
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,10240,3584,0.06420533524619208
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,8192,65536,0.2563199996948242
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,8192,51200,0.24533245298597547
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,8192,16384,0.08525155650244819
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,10240,10240,0.13727733823988172
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,8192,65536,0.5732408629523383
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,8192,51200,0.45213598675198025
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,8192,12288,0.056185775332980685
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,8192,16384,0.145651552412245
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,8192,10240,0.05836888816621569
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,8192,12288,0.10891822311613296
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,8192,16384,0.17203822400834826
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,10240,256,0.026724444495307073
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,8192,8192,0.04804977774620056
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,8192,12288,0.13385244210561117
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,8192,10240,0.09381066428290473
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,8192,7168,0.036397334602144026
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,8192,8192,0.07397688759697808
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,8192,10240,0.11600889099968804
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,8192,8192,0.09781333472993638
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,8192,6144,0.03700800074471368
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,8192,7168,0.06876177920235528
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,8192,5120,0.031088001198238794
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,8192,7168,0.08915644221835667
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,8192,6144,0.059454222520192467
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,8192,51200,0.5192835595872667
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,8192,4096,0.0254737784465154
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,8192,6144,0.08012266953786214
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,8192,5120,0.051860445075564914
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,8192,65536,0.6577235327826606
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,8192,3584,0.020456888609462313
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,8192,3072,0.019883554842736986
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,8192,4096,0.060292442639668785
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,8192,4096,0.04275555411974589
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,8192,3584,0.05650933583577474
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,8192,2560,0.016843555702103507
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,8192,2048,0.014187556174066333
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,8192,3072,0.05232355660862393
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,8192,3072,0.03531377845340305
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,8192,1536,0.012425777812798819
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,8192,2560,0.031769778993394636
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,8192,2048,0.04201066825124952
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,8192,1024,0.009764444496896531
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,8192,1536,0.023102222217453852
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,8192,1536,0.03717866539955139
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,8192,768,0.008269333177142674
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,8192,1024,0.03325244453218248
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,8192,768,0.01757066614098019
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,8192,512,0.006671999891599019
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,8192,768,0.030248890320460003
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,8192,512,0.016235555211702984
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,8192,256,0.005250666704442766
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,8192,5120,0.07125600179036458
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,8192,256,0.01568177839120229
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,8192,128,0.004585777719815572
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,8192,3584,0.038557334078682795
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,8192,256,0.025639999243948195
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,8192,64,0.004527111020353106
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,8192,128,0.01510933372709486
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,8192,32,0.004584889031118817
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,8192,128,0.023369777533743117
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,8192,2560,0.04797955685191684
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,8192,64,0.014761777387724983
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,8192,2048,0.02676533328162299
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,7168,65536,0.30401333173116046
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,7168,51200,0.24634843402438691
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,7168,65536,0.5465244187249078
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,8192,512,0.027708444330427382
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,7168,16384,0.08098133405049641
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,7168,51200,0.4261733425988092
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,7168,16384,0.13252888785468206
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,7168,12288,0.06523466772503324
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,7168,16384,0.17029778162638345
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,7168,12288,0.10281866788864136
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,7168,10240,0.05369155605634054
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,7168,12288,0.13378577762179905
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,8192,32,0.014814222852389017
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,7168,8192,0.04549333453178406
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,7168,10240,0.09076533052656387
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,7168,65536,0.6533288955688477
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,7168,7168,0.04115466607941522
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,7168,51200,0.5147751172383627
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,7168,10240,0.11500799655914307
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,7168,8192,0.07455822494294909
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,7168,6144,0.03560533457332187
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,7168,8192,0.09762755367490981
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,7168,5120,0.030127998855378892
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,7168,7168,0.0660053359137641
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,7168,7168,0.08902400069766575
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,7168,4096,0.025202666719754536
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,7168,6144,0.05833244323730469
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,7168,6144,0.0792071090804206
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,7168,5120,0.04988266693221199
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,7168,3584,0.022320000661744013
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,7168,5120,0.07038222418891059
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,7168,3072,0.019867555962668527
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,7168,4096,0.05992888742023044
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,7168,4096,0.04140799906518724
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,7168,2560,0.01754666699303521
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,7168,3584,0.056120885743035205
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,7168,2048,0.01535555554760827
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,7168,3072,0.03452444407675002
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,7168,3072,0.05215733249982198
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,7168,2560,0.031150221824645996
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,7168,1536,0.013020444247457715
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,7168,2048,0.04177422324816386
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,7168,2048,0.02622311148378584
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,7168,1024,0.010334221853150262
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,7168,1536,0.02230577833122677
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,7168,1536,0.03738044367896186
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,7168,768,0.008623110751310984
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,7168,1024,0.018545778261290658
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,7168,1024,0.031558222240871854
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,7168,512,0.006583111153708563
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,7168,768,0.017208000024159748
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,7168,768,0.030142221185896132
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,7168,256,0.00574311117331187
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,7168,512,0.02676800058947669
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,7168,128,0.005208000126812193
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,7168,256,0.026686223016844854
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,8192,1024,0.019270223047998216
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,7168,64,0.0047066667013698155
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,7168,128,0.024023110667864483
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,7168,128,0.014448000325096978
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,7168,32,0.006268444574541516
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,7168,64,0.014140443669425117
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,7168,32,0.014123555686738757
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,7168,3584,0.03792444533771939
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,6144,65536,0.26673867967393666
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,7168,2560,0.047650665044784546
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,6144,51200,0.19713955455356172
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,6144,16384,0.07673955625957914
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,6144,65536,0.5033466551038954
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,6144,51200,0.3940257761213515
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,6144,12288,0.051720887422561646
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,6144,16384,0.1265182230207655
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,6144,10240,0.04376444551679823
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,6144,16384,0.16873866981930205
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,7168,512,0.01552177800072564
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,7168,256,0.01482399966981676
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,6144,8192,0.039729777309629656
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,6144,12288,0.09845866759618123
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,6144,12288,0.13282310962677002
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,6144,7168,0.03477511141035292
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,6144,10240,0.08432622088326348
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,6144,10240,0.11462310949961345
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,6144,8192,0.06913689110014173
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,6144,6144,0.02839822239345974
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,6144,8192,0.09700710905922784
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,6144,5120,0.023967110448413428
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,6144,7168,0.06157422065734863
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,6144,7168,0.08838044272528754
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,6144,4096,0.02017155620786879
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,6144,51200,0.51346222559611
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,6144,6144,0.07904711034562853
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,6144,5120,0.04583644535806444
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,6144,65536,0.6499146885342068
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,6144,5120,0.06980711221694946
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,6144,4096,0.03906222184499105
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,6144,3072,0.01705333259370592
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,6144,4096,0.05970133013195462
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,6144,3584,0.055861334005991616
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,6144,2560,0.014470222923490735
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,6144,3072,0.0517084432972802
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,6144,2048,0.013043555948469373
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,6144,2560,0.047261334127850003
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,6144,2560,0.029575109481811523
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,6144,1536,0.00998399986161126
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,6144,2048,0.024846222665574815
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,6144,2048,0.0415653321478102
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,6144,1024,0.008669333325492011
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,6144,1536,0.021333333518770006
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,6144,1536,0.03632888860172696
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,6144,768,0.0075235557225015424
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,6144,1024,0.017834666702482436
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,6144,1024,0.03162489003605313
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,6144,512,0.006245333287451003
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,6144,768,0.016480889585283067
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,6144,768,0.029816001653671265
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,6144,256,0.005218666460778978
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,6144,512,0.015265777707099915
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,6144,512,0.02706844442420536
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,6144,128,0.004591111093759537
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,6144,256,0.01421333352724711
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,6144,256,0.025362667110231187
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,6144,64,0.00453333349691497
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,6144,128,0.014102222190962898
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,6144,128,0.023306666149033442
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,6144,32,0.004546666724814309
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,6144,3584,0.03571288784344991
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,6144,64,0.014119999276267158
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,6144,3072,0.03257333238919576
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,6144,32,0.013788444300492605
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,5120,65536,0.19767467180887857
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,5120,51200,0.13900355497996011
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,5120,16384,0.04883644315931532
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,5120,65536,0.46087646484375
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,5120,16384,0.1161786715189616
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,5120,12288,0.04244622257020739
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,5120,16384,0.1679768827226427
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,5120,12288,0.09052799807654487
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,6144,6144,0.05344444513320923
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,5120,10240,0.03419466813405355
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,6144,3584,0.019275556008021038
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,5120,8192,0.03162755568822225
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,5120,51200,0.5074382358127171
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,5120,10240,0.07738577657275729
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,5120,12288,0.1319084432390001
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,5120,65536,0.6437830924987793
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,5120,7168,0.027998222245110407
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,5120,10240,0.11476000150044759
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,5120,6144,0.024199111594094172
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,5120,8192,0.06309955649905734
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,5120,8192,0.09565955400466919
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,5120,5120,0.02053511142730713
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,5120,7168,0.056088891294267446
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,5120,6144,0.04842311143875122
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,5120,7168,0.08742400010426839
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,5120,6144,0.07811644342210558
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,5120,4096,0.017328888177871704
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,5120,3584,0.015207999282413058
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,5120,5120,0.06910755236943562
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,5120,5120,0.04226400123702156
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,5120,3072,0.013770666387346057
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,5120,4096,0.05911466810438368
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,5120,4096,0.03615377677811517
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,5120,2560,0.012078222301271228
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,5120,3584,0.03325155708524916
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,5120,3584,0.05515999926461113
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,5120,2048,0.010969777901967367
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,5120,3072,0.030288888348473444
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,5120,3072,0.051424887445237905
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,5120,1536,0.009339555270142024
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,5120,2560,0.027748444014125403
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,5120,1024,0.007237333390447829
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,5120,2048,0.04088711076312595
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,5120,1536,0.019928889142142404
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,5120,768,0.006098666538794835
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,5120,1024,0.030857778257793848
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,5120,1024,0.016873778568373788
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,5120,512,0.005256888767083486
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,5120,768,0.029500444730122883
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,5120,768,0.015808888607554965
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,5120,256,0.004500444564554426
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,5120,512,0.014775110615624322
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,5120,512,0.027348443865776062
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,5120,128,0.003867555409669876
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,5120,256,0.014193778236707052
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,5120,256,0.02607733342382643
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,5120,64,0.003834666477309333
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,5120,128,0.013435555828942193
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,5120,128,0.024132443798912898
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,5120,32,0.003921777837806278
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,5120,64,0.013742222554153867
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,5120,32,0.013439111411571503
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,4096,65536,0.19966399669647217
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,5120,51200,0.36260800891452366
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,4096,51200,0.13601956102583143
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,5120,2048,0.023131555981106226
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,4096,16384,0.052413334449132286
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,4096,65536,0.42095200220743817
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,5120,1536,0.03660444418589274
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,4096,12288,0.03990488913324144
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,4096,51200,0.32905954784817165
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,4096,16384,0.1049928863843282
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,4096,10240,0.033313777711656355
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,4096,16384,0.1349617772632175
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,4096,12288,0.0801360011100769
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,4096,8192,0.027450667487250432
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,4096,10240,0.07032089100943671
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,4096,10240,0.09319288863076104
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,4096,65536,0.5081209076775445
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,4096,8192,0.056645333766937256
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,4096,7168,0.023102222217453852
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,4096,51200,0.4043742285834418
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,4096,8192,0.07843466599782307
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,4096,6144,0.02070577773782942
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,4096,5120,0.017460443907313876
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,4096,7168,0.0720871090888977
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,4096,7168,0.05031999945640564
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,4096,6144,0.0651093324025472
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,4096,6144,0.04431822233729892
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,4096,5120,0.03911644551489089
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,4096,5120,0.05810133616129557
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,4096,3584,0.01349955548842748
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,5120,2560,0.047100444634755455
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,4096,3072,0.012695111334323883
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,4096,3584,0.04765955607096354
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,4096,3584,0.030856887499491375
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,4096,2560,0.011400889191362592
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,4096,3072,0.028444445795483057
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,4096,3072,0.04424444503254361
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,4096,2048,0.009639110830095079
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,4096,2560,0.025723555021815833
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,4096,2560,0.04107111030154758
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,4096,1536,0.007647111184067196
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,4096,2048,0.02161066730817159
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,4096,2048,0.034392890002992414
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,4096,12288,0.10679022471110027
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,4096,1024,0.006175111151403851
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,4096,1536,0.018639999959203932
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,4096,1536,0.030880000856187608
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,4096,768,0.005555555638339784
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,4096,1024,0.028099556763966877
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,4096,1024,0.016153777639071148
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,4096,512,0.004855999930037392
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,4096,768,0.015111999379263984
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,4096,256,0.004226666771703296
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,4096,512,0.024728889266649883
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,4096,512,0.014114666316244336
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,4096,128,0.003846222327815162
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,4096,4096,0.01514844430817498
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,4096,256,0.013744889034165276
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,4096,256,0.02365155518054962
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,4096,64,0.003543111185232798
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,4096,32,0.00388355553150177
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,4096,128,0.013136000268989138
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,4096,4096,0.03303111261791653
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,4096,64,0.012832889126406776
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,4096,32,0.013108444710572561
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,3584,65536,0.16048622131347656
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,3584,51200,0.11852533287472194
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,3584,65536,0.41513776779174805
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,3584,16384,0.04604533314704895
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,3584,16384,0.10356355375713772
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,4096,768,0.027408889598316614
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,3584,16384,0.13349778122372097
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,3584,12288,0.035177777210871376
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,3584,10240,0.030584000878863867
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,3584,65536,0.5039813253614638
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,3584,51200,0.3980871041615804
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,3584,12288,0.1063271098666721
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,3584,8192,0.024816888901922438
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,4096,128,0.02239466706911723
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,3584,10240,0.06947910785675049
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,3584,10240,0.09262310796313816
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,4096,4096,0.05030044582155016
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,3584,7168,0.021818665994538203
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,3584,6144,0.018767999278174508
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,3584,8192,0.054810666375690036
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,3584,8192,0.07801600297292073
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,3584,5120,0.016214221715927124
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,3584,7168,0.07129955291748047
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,3584,7168,0.04930577675501505
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,3584,6144,0.04331288735071818
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,3584,4096,0.014020444618331062
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,3584,6144,0.06477510929107666
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,3584,3584,0.012824888858530255
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,3584,5120,0.03848888807826572
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,3584,5120,0.0579013360871209
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,3584,3072,0.011395555403497485
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,3584,4096,0.03267644511328803
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,3584,4096,0.05004355642530653
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,3584,2560,0.010619555910428366
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,3584,3584,0.030478222502602473
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,3584,3584,0.04709688822428385
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,3584,2048,0.009318222602208456
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,3584,3072,0.04245866669548882
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,3584,3072,0.027760000692473516
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,3584,51200,0.3246542347802056
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,3584,2560,0.039340443081325956
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,3584,2048,0.020862221717834473
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,3584,2048,0.0339662233988444
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,3584,1024,0.006258666515350342
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,3584,1536,0.018010665973027546
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,3584,1536,0.031000001562966242
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,3584,768,0.005261333452330695
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,3584,1024,0.015807110402319167
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,3584,1024,0.028350220786200628
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,3584,512,0.004872888740566042
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,3584,768,0.027066666218969557
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,3584,256,0.004261333495378494
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,3584,512,0.014123555686738757
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,3584,512,0.024728889266649883
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,3584,128,0.0038888889054457345
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,3584,256,0.013455111119482251
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,3584,256,0.02496355606449975
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,3584,64,0.003528888854715559
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,3584,128,0.013076444466908773
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,3584,128,0.021928000781271193
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,3584,32,0.003830222205983268
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,3584,64,0.013112000293201871
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,3584,32,0.01277955538696713
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,3072,65536,0.15475822819603816
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,3072,51200,0.11275111304389106
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,3584,1536,0.007921777665615082
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,3584,2560,0.025035555164019268
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,3072,65536,0.37599910630120176
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,3072,16384,0.04294044441647
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,3072,51200,0.29504089885287815
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,3072,16384,0.09513155619303386
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,3072,12288,0.03307377629809909
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,3072,16384,0.13355288240644667
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,3072,10240,0.027285334136750963
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,3584,12288,0.07693155606587727
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,3072,65536,0.5022115707397461
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,3072,12288,0.07389866643481784
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,3072,12288,0.10615999831093682
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,3072,8192,0.022385777698622808
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,3072,10240,0.06298755274878608
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,3072,7168,0.019484443797005545
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,3072,8192,0.07755288812849256
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,3072,8192,0.051368888881471425
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,3072,6144,0.01720177796151903
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,3072,7168,0.07106044557359484
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,3072,7168,0.04498666524887085
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,3072,5120,0.015088000231319003
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,3072,6144,0.0407608879937066
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,3072,6144,0.06458489100138347
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,3072,4096,0.012967111335860359
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,3072,5120,0.035775999228159584
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,3072,5120,0.05754399961895413
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,3072,3584,0.012062222593360476
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,3072,4096,0.03052088949415419
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,3072,4096,0.04996000064743889
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,3072,3072,0.010989333192507425
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,3072,3584,0.028070221344629925
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,3072,3584,0.0469706654548645
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,3072,2560,0.00961688905954361
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,3072,3072,0.025811556312772963
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,3072,3072,0.04292800029118856
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,3072,2048,0.008356444537639618
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,3072,2560,0.023706666297382776
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,3072,2560,0.03923377725813124
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,3072,1536,0.0069679998689227635
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,3584,768,0.01479022204875946
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,3072,1024,0.0058959999846087555
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,3072,2048,0.03401688734690348
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,3072,2048,0.01945955554644267
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,3072,1536,0.030795554320017498
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,3072,1024,0.02823288904296027
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,3072,1024,0.01513777838812934
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,3072,512,0.0045422220395671
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,3072,768,0.014459555347760519
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,3072,10240,0.09219111336602105
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,3072,768,0.027224888404210407
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,3072,256,0.0041804446114434134
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,3072,512,0.013752889302041797
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,3072,512,0.025067556235525344
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,3072,128,0.003843555433882607
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,3072,256,0.013433777623706393
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,3072,256,0.024687111377716064
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,3072,64,0.0035208890007601846
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,3072,128,0.02199111051029629
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,3072,128,0.01275022245115704
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,3072,64,0.012787555654843649
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,3072,32,0.012738666600651212
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,2560,65536,0.13018043835957846
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,2560,51200,0.1017635530895657
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,2560,65536,0.37209333313835996
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,3072,768,0.005222222043408289
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,2560,51200,0.29155998759799534
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,2560,16384,0.03821244504716661
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,3072,51200,0.3965680069393582
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,2560,16384,0.09362844626108806
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,2560,65536,0.5019769138760036
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,2560,12288,0.029437333345413208
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,2560,16384,0.1331804460949368
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,2560,10240,0.02316355539692773
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,2560,12288,0.07283822033140394
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,3072,32,0.0038906666967603895
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,2560,8192,0.019711999429596793
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,2560,12288,0.1052008867263794
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,2560,10240,0.06157155831654867
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,2560,10240,0.0916551086637709
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,2560,7168,0.017473777135213215
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,2560,6144,0.015435554915004306
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,2560,8192,0.07753155628840129
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,2560,8192,0.05048444535997179
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,2560,7168,0.04417066772778829
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,2560,7168,0.07108000251981947
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,2560,5120,0.013783999615245394
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,2560,6144,0.04015200005637275
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,2560,4096,0.011995555626021491
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,2560,6144,0.06419289112091064
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,2560,3584,0.011362666885058085
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,2560,5120,0.05737244420581394
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,2560,4096,0.04939111073811849
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,2560,4096,0.029954665237002905
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,2560,3072,0.010007999837398529
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,2560,3584,0.027124444643656414
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,2560,3584,0.046557333734300405
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,3072,1536,0.01721333298418257
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,2560,3072,0.02464444438616435
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,2560,2048,0.007603555917739868
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,2560,2560,0.02294933299223582
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,2560,2560,0.038316445218192205
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,2560,1536,0.006583999842405319
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,2560,2048,0.0192248887485928
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,2560,2048,0.034499555826187134
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,2560,1024,0.005565333283609814
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,2560,1536,0.01686044368478987
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,2560,1536,0.030821333328882854
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,2560,768,0.004851555658711327
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,2560,51200,0.39548532168070477
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,2560,1024,0.0151235560576121
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,2560,1024,0.027433777848879497
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,2560,512,0.004212444441186057
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,2560,768,0.014157333307796054
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,2560,768,0.02718577782313029
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,2560,512,0.013573333621025085
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,2560,512,0.02568888829814063
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,2560,128,0.0035146665241983202
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,2560,256,0.013095999757448832
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,2560,256,0.023560888237423364
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,2560,64,0.003485333174467087
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,2560,128,0.012737777498033313
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,2560,32,0.003489777859714296
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,2560,128,0.02233422299226125
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,2560,64,0.01239911135700014
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,2048,65536,0.09706844223870172
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,2560,2560,0.008864888714419471
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,2560,32,0.012459555433856117
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,2560,3072,0.04343822267320421
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,2048,51200,0.0814302232530382
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,2048,16384,0.034908443689346313
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,2048,65536,0.33536444769965273
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,2048,51200,0.2638817893134223
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,2048,16384,0.08409777614805435
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,2048,12288,0.025676444172859192
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,2048,16384,0.13049422370062932
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,2048,12288,0.10335822237862481
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,2048,12288,0.06458489100138347
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,2048,65536,0.4907653596666124
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,2560,256,0.0038480001191298165
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,2048,8192,0.018753778603341844
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,2048,10240,0.08983111381530762
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,2048,7168,0.016965332958433364
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,2048,8192,0.04463466670778063
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,2048,8192,0.07568355401357015
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,2048,6144,0.01515111161602868
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,2048,7168,0.04003555576006571
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,2048,7168,0.07020444340176053
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,2048,5120,0.013187555803192986
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,2048,6144,0.03634399837917752
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,2048,6144,0.06304711103439331
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,2048,4096,0.011357333097192975
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,2048,5120,0.03230399886767069
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,2048,5120,0.056438220871819385
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,2048,3584,0.010199111368921068
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,2048,4096,0.02701688806215922
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,2048,4096,0.04682133264011807
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,2048,3072,0.009484444227483537
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,2048,3584,0.02557955516709222
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,2048,3584,0.04389955600102743
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,2048,2560,0.008281778130266402
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,2048,3072,0.023431999815834895
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,2048,3072,0.04071022073427836
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,2048,51200,0.38834577136569554
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,2048,2048,0.007313778003056844
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,2048,2560,0.020810667011472914
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,2048,2560,0.037666665183173284
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,2048,1536,0.006246222390068903
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,2048,2048,0.033611555894215904
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,2048,10240,0.05483822358979119
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,2048,1024,0.0052693333062860705
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,2048,1536,0.030621333254708186
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,2048,1536,0.016171556380059984
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,2048,768,0.00452622233165635
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,2560,5120,0.03542044427659776
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,2048,1024,0.027473777532577515
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,2048,512,0.003910222401221593
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,2048,768,0.026826666461096868
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,2048,768,0.013754666679435305
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,2048,256,0.003858666867017746
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,2048,512,0.01313688854376475
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,2048,512,0.024331554770469666
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,2048,128,0.003913777983850903
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,2048,256,0.012744888663291931
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,2048,256,0.024375999967257183
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,2048,64,0.0035582222044467926
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,2048,128,0.021596444977654353
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,2048,128,0.012404444317022959
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,2048,32,0.0038515557017591265
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,2048,64,0.012423111332787408
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,1536,65536,0.0864480005370246
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,2048,32,0.012106666962305704
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,1536,51200,0.07088533374998304
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,2048,10240,0.02260444396071964
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,1536,16384,0.02796622117360433
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,1536,65536,0.3272266652848986
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,2048,2048,0.017880888448821176
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,1536,51200,0.25723910331726074
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,1536,12288,0.019799111617936026
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,1536,16384,0.08172000116772123
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,1536,10240,0.017137777474191453
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,1536,16384,0.12980443901485866
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,2048,1024,0.014440000057220459
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,1536,8192,0.0144213338692983
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,1536,12288,0.06379999717076619
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,1536,65536,0.48667287826538086
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,1536,51200,0.38608445061577695
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,1536,7168,0.013576000101036496
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,1536,10240,0.0889822244644165
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,1536,6144,0.012078222301271228
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,1536,8192,0.07530311081144545
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,1536,8192,0.043806221750047475
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,1536,5120,0.010592888626787396
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,1536,7168,0.039694223139021136
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,1536,7168,0.06912355290518866
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,1536,4096,0.009316444396972656
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,1536,6144,0.03531555665863885
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,1536,6144,0.0620959997177124
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,1536,3584,0.008678221868144141
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,1536,5120,0.031565331750445895
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,1536,4096,0.04597155584229363
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,1536,4096,0.026501332720120747
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,1536,3072,0.00759733302725686
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,1536,3584,0.043268445465299815
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,1536,2560,0.0069466663731469055
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,1536,3072,0.022288888692855835
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,1536,3072,0.04049688908788893
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,1536,2048,0.00599911105301645
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,1536,2560,0.021147555775112573
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,1536,2560,0.03799022237459818
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,1536,1536,0.00555377784702513
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,1536,2048,0.017847110827763874
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,1536,2048,0.03354133168856303
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,1536,1024,0.004567111117972268
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,1536,1536,0.016138666205936007
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,1536,12288,0.10310933325025771
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,1536,1024,0.014316444595654806
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,1536,1024,0.027758222487237718
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,1536,10240,0.05254311031765408
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,1536,512,0.0038382220599386427
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,1536,768,0.013795555465751223
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,1536,768,0.02674666709370083
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,1536,256,0.0035111109415690103
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,1536,512,0.013078221844302284
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,1536,512,0.02527644402450985
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,1536,128,0.0032115555885765287
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,1536,5120,0.0555902189678616
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,1536,256,0.022649778260125056
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,1536,64,0.003463111196955045
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,1536,128,0.012435555458068848
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,1536,128,0.02164977788925171
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,1536,3584,0.024688000480333965
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,1536,32,0.0031715554909573663
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,1024,65536,0.056129780080583364
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,1536,64,0.012044444680213928
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,1536,32,0.012057777908113269
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,1024,51200,0.04497866829236349
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,1024,65536,0.28676533699035645
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,1024,16384,0.01923377811908722
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,1024,51200,0.2256008783976237
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,1536,768,0.004540444248252445
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,1024,16384,0.0714977780977885
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,1024,51200,0.3805564509497748
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,1024,65536,0.4815066655476888
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,1024,16384,0.128694216410319
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,1024,12288,0.018927110566033255
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,1024,10240,0.016694222887357075
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,1024,8192,0.01401511165830824
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,1024,12288,0.054550220568974815
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,1024,12288,0.10167466931872898
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,1024,10240,0.08856978019078572
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,1024,10240,0.045829332537121244
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,1024,7168,0.012825777961148156
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,1024,6144,0.01145244472556644
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,1024,8192,0.03784711162249247
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,1536,256,0.012753778033786349
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,1024,8192,0.07482844591140747
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,1024,7168,0.06909066438674927
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,1024,7168,0.03449599941571554
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,1024,5120,0.010199111368921068
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,1024,4096,0.008627555436558193
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,1024,6144,0.030864887767367895
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,1024,6144,0.06215555800331963
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,1024,3584,0.007832888927724626
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,1024,5120,0.0550817781024509
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,1024,5120,0.027458666099442378
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,1024,3072,0.006983111302057902
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,1024,4096,0.04793688986036512
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,1024,3584,0.021793777743975323
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,1024,3584,0.04345155424541897
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,1024,3072,0.03973866502443949
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,1024,2048,0.005633777628342311
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,1024,2560,0.018887110882335238
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,1536,1536,0.030084444416893855
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,1024,1536,0.004920888692140579
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,1024,2048,0.016174222032229107
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,1024,2048,0.03331289026472304
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,1024,1024,0.004234666625658671
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,1024,1536,0.015235554840829639
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,1024,1024,0.013749333719412485
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,1024,1024,0.027073777384228174
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,1024,768,0.013071111506885953
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,1024,768,0.02574933403068119
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,1024,512,0.0038399998512532976
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,1024,4096,0.02367199957370758
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,1024,512,0.012563555604881711
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,1024,2560,0.006572444405820634
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,1024,256,0.003206222214632564
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,1024,512,0.025049777494536504
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,1024,3072,0.020256888535287645
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,1024,128,0.003160888950030009
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,1024,2560,0.03733777668741014
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,1024,256,0.022983110613293115
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,1024,256,0.012073777616024017
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,1024,64,0.0028408887899584244
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,1024,32,0.0031591111587153543
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,1024,128,0.02159822152720557
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,768,65536,0.04679377873738607
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,1024,64,0.011720889144473605
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,1024,32,0.012087999946541257
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,768,51200,0.037921776374181114
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,1024,1536,0.030023998684353296
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,768,16384,0.01720711092154185
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,1024,768,0.0038577777643998465
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,768,65536,0.28551112280951607
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,768,12288,0.016183111402723525
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,768,16384,0.07058666812049018
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,768,51200,0.22150933742523193
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,768,10240,0.014449778530332776
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,768,16384,0.12810222307840982
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,768,12288,0.053555554813808866
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,768,51200,0.3788782225714789
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,768,65536,0.4792666435241699
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,768,12288,0.10070311360889012
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,768,8192,0.013051555388503604
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,768,7168,0.012692444854312472
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,768,10240,0.08831910954581366
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,768,6144,0.010958222051461538
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,768,8192,0.07462400197982788
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,768,7168,0.06835466623306274
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,768,7168,0.034295111894607544
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,768,5120,0.009642666412724389
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,768,6144,0.030615111192067463
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,768,6144,0.061829335159725614
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,768,4096,0.008055110772450766
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,768,5120,0.05379288726382785
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,768,3584,0.007647111184067196
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,1024,128,0.012058667010731168
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,768,4096,0.02331466641690996
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,768,4096,0.04554222358597649
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,768,3072,0.0069777775141927935
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,768,3584,0.02165066699186961
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,768,3584,0.042613334125942655
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,768,2560,0.006239999913507038
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,768,3072,0.020241777102152508
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,768,3072,0.0398595564895206
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,768,2048,0.00556355549229516
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,768,2560,0.018544000056054857
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,768,2560,0.037103109889560275
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,768,1536,0.005165333135260476
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,768,2048,0.03306488858328925
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,768,2048,0.016415999995337594
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,768,1024,0.004581333448489507
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,768,1536,0.01482399966981676
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,768,1536,0.030010667112138536
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,768,768,0.0041928887367248535
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,768,1024,0.013432888521088494
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,768,10240,0.04558933443493313
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,768,512,0.003842666745185852
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,768,768,0.01276088919904497
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,768,768,0.025841777523358662
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,768,256,0.003516444315512975
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,768,8192,0.03764266769091288
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,768,512,0.02365422248840332
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,768,512,0.012771555946932899
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,768,128,0.0032248888164758682
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,768,256,0.01202222208182017
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,768,64,0.003144888828198115
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,768,128,0.02126844392882453
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,768,5120,0.027087999714745417
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,768,32,0.0031600000543726813
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,768,64,0.011701333026091257
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,512,65536,0.03518133362134298
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,768,32,0.011702222128709158
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,512,51200,0.028520888752407495
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,512,65536,0.2841973304748535
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,512,16384,0.014813333749771118
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,512,51200,0.22397332721286348
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,512,65536,0.4786071247524685
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,512,16384,0.07001777489980061
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,512,51200,0.37705334027608234
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,512,12288,0.012786666552225748
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,768,1024,0.027087999714745417
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,512,10240,0.014173333843549093
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,512,16384,0.1279360055923462
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,512,8192,0.013411555853154926
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,512,12288,0.05233600073390537
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,512,10240,0.08795999818378025
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,512,10240,0.044362667534086436
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,512,7168,0.0120328888297081
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,768,256,0.023230221536424425
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,512,8192,0.03725333346260919
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,512,8192,0.0739555557568868
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,512,6144,0.010632889138327705
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,512,5120,0.009300444689061906
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,768,128,0.011712888876597086
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,512,7168,0.03360266817940606
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,512,7168,0.06844977537790935
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,512,4096,0.007992000215583378
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,512,6144,0.0614008903503418
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,512,3584,0.007253333098358578
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,512,5120,0.027423111928833857
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,512,4096,0.02315644423166911
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,512,4096,0.04549422197871738
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,512,3072,0.006865777903132969
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,512,3584,0.02160444524553087
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,512,2560,0.006203555398517185
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,512,3072,0.02017688916789161
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,512,3072,0.039670222335391574
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,512,2048,0.005550222264395819
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,512,2560,0.018227555685573153
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,512,2560,0.03706577751371596
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,512,1536,0.004927111168702443
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,512,2048,0.01625688870747884
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,512,2048,0.03258488906754388
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,512,1024,0.0041751112374994485
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,512,1536,0.01495911180973053
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,512,1536,0.02968533171547784
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,512,768,0.0038702223036024305
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,512,12288,0.100490669409434
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,512,1024,0.013110222087966071
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,512,1024,0.027106665902667578
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,512,512,0.0035084444615576
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,512,768,0.01278133359220293
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,512,256,0.003157333367400699
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,512,512,0.024098666177855596
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,512,256,0.011751111182901593
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,512,6144,0.029847111966874864
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,512,128,0.0028355556229750314
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,512,5120,0.052905778090159096
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,512,64,0.00281866660548581
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,512,128,0.021271111236678228
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,512,128,0.011728000309732227
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,512,32,0.0028248888750871024
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,512,3584,0.042825778325398765
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,256,65536,0.024120888776249353
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,512,64,0.011718221836619906
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,256,51200,0.019877332780096266
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,256,65536,0.2842782338460286
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,256,51200,0.21910044882032606
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,256,16384,0.011363555159833698
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,256,65536,0.47822931077745223
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,256,16384,0.06522755490409003
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,512,768,0.026085333691702947
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,256,16384,0.12783911493089464
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,256,51200,0.37772711118062335
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,256,12288,0.012723555167516073
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,512,512,0.012404444317022959
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,256,10240,0.011808888779746162
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,256,8192,0.010327999790509542
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,512,256,0.02332266668478648
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,256,10240,0.0433884428607093
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,256,10240,0.08808444605933295
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,256,7168,0.00965244405799442
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,256,8192,0.03672800130314297
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,256,8192,0.0734986662864685
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,256,6144,0.009009777671760982
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,256,7168,0.03371822171741062
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,256,5120,0.008346666892369589
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,512,32,0.011657777759763928
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,256,6144,0.029158221350775823
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,256,4096,0.007584888901975419
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,256,5120,0.026748443643252056
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,256,4096,0.022960889670583937
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,256,3584,0.006962666908899943
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,256,4096,0.04557244314087761
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,256,3584,0.021331555313534204
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,256,3584,0.04244355691803826
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,256,3072,0.006256000035338932
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,256,12288,0.05134488807784187
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,256,2560,0.005873777800136142
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,256,3072,0.019907555646366544
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,256,3072,0.04007644454638163
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,256,2048,0.005246222019195557
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,256,2560,0.037104888094796076
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,256,2560,0.018544889158672757
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,256,7168,0.06584178076850043
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,256,1536,0.004589333302444882
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,256,2048,0.016192000773217943
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,256,6144,0.059189332856072314
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,256,2048,0.0329368876086341
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,256,1536,0.014787554740905762
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,256,1536,0.029550221231248643
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,256,768,0.003834666477309333
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,256,5120,0.05243733194139269
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,256,1024,0.01313688854376475
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,256,1024,0.027287999788920086
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,256,512,0.0035111109415690103
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,256,256,0.0032071111102898917
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,256,768,0.02570488883389367
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,256,512,0.02438755498992072
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,256,512,0.01238222254647149
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,256,128,0.0028231110837724474
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,256,256,0.022064889470736187
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,256,64,0.0028373334142896864
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,256,128,0.011718221836619906
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,256,128,0.021724444296624925
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,256,32,0.002834666727317704
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,128,65536,0.0181377778450648
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,256,64,0.011423110961914062
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,256,32,0.011712888876597086
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,128,51200,0.014883556299739413
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,256,12288,0.10070221953921848
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,128,65536,0.28384799427456325
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,128,16384,0.009956444303194681
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,128,51200,0.22301244735717773
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,128,65536,0.4770000245836046
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,256,1024,0.004173333446184794
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,128,12288,0.00869333330127928
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,128,16384,0.06828622023264568
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,128,51200,0.37820710076226133
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,128,16384,0.12785511546664768
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,128,10240,0.009323555562231276
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,128,8192,0.00831200016869439
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,128,12288,0.050660444630516895
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,128,12288,0.10005688667297363
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,256,768,0.012727110750145383
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,128,7168,0.00793688909875022
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,128,10240,0.08579199843936497
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,128,8192,0.03549155592918396
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,128,6144,0.007609777980380588
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,128,8192,0.07197866837183635
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,128,7168,0.03273866573969523
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,128,7168,0.06583999925189547
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,128,5120,0.007979555262459649
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,128,4096,0.007613333563009898
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,128,6144,0.029245333539115057
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,128,5120,0.052383999029795326
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,128,3584,0.0069546666410234236
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,128,4096,0.023000000251664057
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,128,4096,0.04516977734035916
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,128,3072,0.006222222414281633
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,128,3584,0.02127911150455475
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,128,3072,0.01963733302222358
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,128,2560,0.0057946667075157166
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,128,3072,0.039240890079074435
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,128,2560,0.018187556001875136
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,128,2048,0.005218666460778978
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,128,2048,0.015807999504937064
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,128,10240,0.042655110359191895
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,128,1536,0.004572444491916233
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,256,256,0.011754666765530905
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,128,2048,0.03230488962597317
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,128,1024,0.0038720000949170855
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,128,1536,0.01479111115137736
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,128,6144,0.059170663356781006
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,128,1536,0.029470221863852605
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,128,768,0.0038453332251972626
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,128,5120,0.02658133374320136
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,128,1024,0.013091555900043912
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,128,1024,0.026781333817376032
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,128,512,0.0034933334423436057
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,128,256,0.003156444471743372
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,128,768,0.012416000167528788
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,128,768,0.026385777526431616
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,128,128,0.0028604444944196274
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,128,512,0.012068444656001197
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,128,3584,0.042500442928738065
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,128,256,0.021607110897699993
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,128,64,0.0028533333291610083
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,128,128,0.020720889170964558
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,128,128,0.0120666664507654
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,64,65536,0.01626311077011956
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,128,64,0.011359111302428775
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,64,51200,0.013832000394662222
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,128,32,0.011067555182509951
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,128,2560,0.03645955522855123
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,64,16384,0.009720000127951304
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,64,12288,0.008287111090289222
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,64,65536,0.2836586634318034
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,64,10240,0.008970666262838576
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,64,51200,0.22278756565517852
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,64,8192,0.008245333201355403
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,64,12288,0.05036711030536228
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,64,7168,0.007928888830873702
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,64,10240,0.04203822215398153
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,64,6144,0.007278222176763747
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,64,8192,0.03571555680698819
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,64,5120,0.008016889293988546
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,64,7168,0.03261422117551168
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,64,4096,0.0076044441925154785
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,64,6144,0.029471112622155085
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,64,3584,0.006958222223652734
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,64,5120,0.026399999856948853
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,512,128,512,0.023316444622145757
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,64,3072,0.006638222270541721
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,64,4096,0.02295822236273024
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,64,2560,0.006259555617968242
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,128,256,0.011744000017642975
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,64,2048,0.006239999913507038
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,64,3584,0.021198223034540813
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,64,1536,0.004541333350870344
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,128,32,0.002805333377586471
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,64,3072,0.019613333874278598
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,64,2560,0.01825066738658481
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,64,768,0.0035128887328836652
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,64,512,0.003168888803985384
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,64,1536,0.01482311056719886
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,64,256,0.0028311111446883944
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,64,1024,0.013454222016864352
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,64,768,0.01239999963177575
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,64,128,0.0028400001012616684
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,64,512,0.012103111379676394
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,64,64,0.0025155554629034465
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,64,32,0.002569777684079276
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,64,256,0.01184800018866857
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,64,128,0.011370666325092316
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,32,65536,0.028132445282406274
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,64,64,0.01131199962562985
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,64,16384,0.06839999887678358
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,32,51200,0.02292088833120134
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,64,32,0.011722666521867117
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,32,16384,0.009292444421185387
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,32,12288,0.008671999805503422
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,32,10240,0.00797333319981893
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,32,16384,0.06824533144632976
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,32,12288,0.050592889388402305
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,32,8192,0.008274666965007782
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,32,65536,0.28339823087056476
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,32,51200,0.22270578808254668
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,32,7168,0.007991111112965478
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,32,10240,0.04239644606908163
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,32,6144,0.007320889168315464
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,32,5120,0.007000000112586551
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,32,4096,0.007676444119877285
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,32,8192,0.03523733218510946
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,32,7168,0.032617777585983276
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,32,6144,0.029482665989134047
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,32,3584,0.007251555720965068
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,32,5120,0.026406221919589575
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,32,3072,0.006983111302057902
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,32,2560,0.006367110957702001
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,32,4096,0.022721777359644573
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,32,2048,0.006315555423498154
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,32,3584,0.0210533340771993
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,32,3072,0.019267555740144517
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,64,1024,0.0038444445365005066
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,32,2560,0.018236445056067575
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,32,768,0.003544888976547453
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,32,2048,0.016176889340082806
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,64,2048,0.016145777371194627
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,32,512,0.0031884445084465873
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,32,1536,0.014481777946154276
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,32,256,0.0028604444944196274
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,32,1024,0.012860444684823355
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,32,128,0.0028497777465316984
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,32,768,0.012725333372751871
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,32,512,0.012119111087587146
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,32,256,0.011420444481902652
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,32,32,0.0028044444819291434
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,32,128,0.011381333072980246
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,32,64,0.011779555843936073
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,512,32,32,0.011009777585665384
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,65536,16384,0.3997742335001628
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,65536,16384,0.45194043053521055
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,32,1536,0.004513777792453766
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,65536,12288,0.3147288958231608
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,32,1024,0.0038533334930737815
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,512,32,64,0.0028604444944196274
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,65536,12288,0.33014488220214844
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,65536,10240,0.27858487764994305
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,65536,8192,0.23390844133165148
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,65536,51200,1.31569152408176
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,65536,10240,0.28344800737169057
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,65536,7168,0.2003493309020996
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,65536,8192,0.22404445542229545
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,65536,51200,1.455466694302029
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,65536,7168,0.19713332917955187
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,65536,5120,0.14816533194647893
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,65536,4096,0.12458044952816433
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,65536,5120,0.14583110809326172
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,65536,3584,0.10774577988518609
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,65536,4096,0.11893599563174778
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,65536,6144,0.21116356054941812
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,65536,3072,0.09377066956626044
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,65536,2560,0.0783991085158454
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,65536,3584,0.10639644331402248
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,65536,2048,0.06605688730875652
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,65536,3072,0.09253422419230144
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,65536,1024,0.03814844290415446
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,65536,1536,0.05174933208359612
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,65536,768,0.031010667483011883
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,65536,2048,0.06929066446092394
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,65536,2560,0.08097600274615817
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,65536,512,0.023457777169015672
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,65536,256,0.014169777433077494
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,65536,1024,0.04548711246914334
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,65536,128,0.011737777955002256
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,65536,1536,0.05616977479722765
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,65536,768,0.03856177793608771
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,65536,512,0.03279555506176419
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,65536,256,0.02996088729964362
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,65536,32,0.01351111133893331
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,65536,128,0.028146667612923518
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,65536,64,0.02778844369782342
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,65536,32,0.027800000376171533
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,65536,6144,0.17404445012410483
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,51200,16384,0.34702399041917587
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,51200,16384,0.35674577289157444
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,51200,12288,0.256930669148763
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,51200,12288,0.26600533061557347
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,51200,10240,0.22437334060668945
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,51200,51200,1.0550675921969943
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,65536,64,0.010685332947307162
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,51200,51200,1.1476622687445748
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,51200,8192,0.1747751103507148
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,51200,65536,1.3607378005981445
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,51200,7168,0.1514684491687351
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,51200,10240,0.22448976834615073
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,51200,65536,1.432286262512207
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,51200,6144,0.13917156060536703
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,51200,5120,0.11071999867757161
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,51200,7168,0.16017956203884548
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,51200,4096,0.09257777531941731
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,51200,8192,0.1919342279434204
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,51200,3072,0.0708248880174425
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,51200,3584,0.08075111442142062
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,51200,2560,0.05962489048639933
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,51200,3584,0.08672977818383111
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,51200,3072,0.07703999678293864
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,51200,2560,0.06732622120115492
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,51200,6144,0.14284533924526638
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,51200,4096,0.10075110859341091
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,51200,1536,0.03947644432385763
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,51200,1024,0.029599110285441082
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,51200,768,0.023716444770495098
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,51200,512,0.017668444249365065
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,51200,1536,0.047613332668940224
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,51200,1024,0.03936355643802219
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,51200,768,0.033137778441111244
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,51200,256,0.012698666916953193
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,51200,128,0.010049777726332346
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,51200,2048,0.0573857757780287
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,51200,512,0.02792444494035509
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,51200,64,0.008489777644475302
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,51200,32,0.008632889224423302
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,51200,256,0.025748444928063288
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,51200,128,0.024047111471494038
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,51200,64,0.02407199972205692
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,51200,32,0.024060444699393377
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,16384,16384,0.10323911243014866
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,16384,65536,0.4014151096343994
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,16384,51200,0.3121982150607639
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,51200,5120,0.11894310845269097
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,16384,12288,0.08027022414737277
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,16384,16384,0.14129066467285156
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,16384,10240,0.07287377781338163
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,16384,65536,0.5414649115668403
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,16384,8192,0.06120977799097697
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,51200,2048,0.04962933394643995
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,16384,7168,0.05349422163433499
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,16384,12288,0.10651822222603692
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,16384,6144,0.04649600055482653
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,16384,10240,0.09686488575405544
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,16384,5120,0.04018933243221707
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,16384,4096,0.03423733181423611
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,16384,7168,0.06710133287641737
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,16384,6144,0.05955288807551066
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,16384,8192,0.07511022355821398
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,16384,3584,0.030565334690941706
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,16384,3072,0.026546667019526165
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,16384,5120,0.05295111073387993
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,16384,4096,0.04286488890647888
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,16384,2048,0.01863911085658603
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,16384,1536,0.014936889211336771
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,16384,3584,0.039332442813449435
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,16384,3072,0.03569066524505615
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,16384,2560,0.03147644466824002
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,16384,1024,0.011838222543398539
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,16384,2048,0.027468444572554693
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,16384,768,0.010034666293197209
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,16384,512,0.007972444097201029
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,16384,1536,0.023937778340445623
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,16384,256,0.005919999960396025
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,16384,1024,0.02049066623051961
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,16384,128,0.004863111095296012
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,16384,768,0.018995554910765756
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,16384,64,0.005179555465777715
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,16384,512,0.01720266706413693
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,16384,32,0.0052133335007561584
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,16384,256,0.015992888145976596
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,16384,64,0.015462223026487561
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,16384,128,0.015822221835454304
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,16384,32,0.015125332607163323
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,16384,51200,0.4283120102352566
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,12288,16384,0.08902311325073242
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,12288,65536,0.3017875618404812
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,12288,12288,0.0626408921347724
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,12288,51200,0.23583645290798613
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,12288,10240,0.05214488837454054
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,12288,16384,0.11793066395653619
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,12288,65536,0.44377512402004665
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,12288,51200,0.3424951235453288
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,12288,8192,0.043713778257369995
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,12288,7168,0.04014399978849623
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,12288,10240,0.0768231087260776
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,12288,12288,0.09041421943240696
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,12288,6144,0.033872889147864446
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,12288,5120,0.02949955397182041
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,16384,2560,0.022623111804326374
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,12288,7168,0.05701511436038547
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,12288,4096,0.025273778372340735
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,12288,3072,0.01940533353222741
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,12288,6144,0.05184266633457608
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,12288,5120,0.04628355635537041
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,12288,2560,0.017077333397335477
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,12288,4096,0.03639111253950331
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,12288,2048,0.01481599940194024
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,12288,1536,0.012072888513406118
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,12288,3072,0.030006223254733618
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,12288,2560,0.027241778042581346
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,12288,1024,0.010015111002657149
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,12288,2048,0.024344000551435683
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,12288,768,0.0087333329849773
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,12288,1536,0.021594666772418555
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,12288,512,0.007254222200976477
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,12288,256,0.005555555638339784
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,12288,1024,0.01888799998495314
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,12288,768,0.017415111263593037
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,12288,128,0.004635555462704765
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,12288,512,0.01570577753914727
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,12288,256,0.015145777000321282
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,12288,32,0.004561777744028303
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,12288,128,0.014451555079884
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,12288,64,0.0144195556640625
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,12288,32,0.014091556270917257
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,10240,65536,0.28122221099005806
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,10240,51200,0.2295431031121148
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,12288,8192,0.06345066759321424
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,12288,3584,0.02221333318286472
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,10240,65536,0.39402132564120823
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,12288,3584,0.03420622150103251
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,10240,51200,0.30305422676934135
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,10240,16384,0.10618578063117133
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,10240,10240,0.04988622334268358
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,10240,12288,0.08090311288833618
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,10240,8192,0.04167377617624071
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,10240,7168,0.03641422258483039
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,10240,6144,0.03222844335767958
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,10240,10240,0.06983288791444567
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,10240,8192,0.05775644381841024
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,10240,5120,0.02763644523090786
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,10240,7168,0.05221066541141934
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,10240,4096,0.02352977792421977
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,12288,64,0.004458666675620609
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,10240,3584,0.020869332883093093
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,10240,6144,0.04698488778538174
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,10240,5120,0.040856000449922346
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,10240,3072,0.01829155617290073
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,10240,2560,0.015829333000712924
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,10240,2048,0.013796444568369122
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,10240,3584,0.030693332354227703
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,10240,1536,0.01185955521133211
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,10240,3072,0.027905778752432928
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,10240,2560,0.02552622225549486
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,10240,1024,0.010551999840471478
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,10240,2048,0.022989332675933838
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,10240,768,0.00869599978129069
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,10240,1536,0.02029511166943444
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,10240,512,0.006896889044178857
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,10240,1024,0.017516444126764934
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,10240,256,0.005215999980767568
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,10240,128,0.004523555437723796
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,10240,768,0.016525333126386006
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,10240,512,0.015446222490734525
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,10240,64,0.004556444370084339
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,10240,16384,0.07435822486877441
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,10240,256,0.014466666513019137
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,10240,128,0.013821333646774292
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,10240,32,0.004567111117972268
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,10240,12288,0.05817244450251261
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,10240,64,0.014125333891974555
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,10240,32,0.013411555853154926
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,8192,65536,0.252092440923055
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,8192,16384,0.06495733393563165
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,8192,51200,0.19029333856370714
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,8192,12288,0.05082755618625217
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,8192,10240,0.04264355699221293
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,8192,65536,0.3476693365308974
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,8192,51200,0.26728089650472003
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,8192,16384,0.09416977564493816
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,8192,8192,0.03592177894380357
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,8192,7168,0.031650665733549334
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,8192,12288,0.07245066430833605
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,10240,4096,0.032884445455339216
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,8192,6144,0.028039998478359644
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,8192,8192,0.052367998494042285
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,8192,5120,0.02385422256257799
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,8192,7168,0.046896000703175865
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,8192,4096,0.019863999552196927
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,8192,3584,0.01776355504989624
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,8192,5120,0.03639377819167243
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,8192,3072,0.015501333607567681
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,8192,4096,0.029971556531058416
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,8192,2560,0.013456000222100152
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,8192,2048,0.011695110963450538
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,8192,3584,0.02801688843303257
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,8192,1536,0.009681777821646797
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,8192,3072,0.025654221574465435
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,8192,2560,0.023349333140585158
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,8192,1024,0.008107555409272512
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,8192,2048,0.021074665917290583
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,8192,768,0.006511999915043513
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,8192,512,0.005274666680230035
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,8192,1536,0.018964444597562153
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,8192,256,0.0042275554604000514
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,8192,1024,0.016198222835858662
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,8192,768,0.015463110473420886
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,8192,128,0.0039022221333450745
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,8192,512,0.0148026661740409
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,8192,64,0.004058666527271271
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,8192,256,0.014144889182514615
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,8192,32,0.004204444587230682
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,8192,128,0.013450666434235044
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,8192,64,0.013421333498424955
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,8192,32,0.013070222404268054
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,7168,16384,0.06229066848754883
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,7168,51200,0.1852924426396688
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,8192,10240,0.06289866897794935
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,7168,12288,0.048876444498697914
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,7168,65536,0.31100622812906903
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,7168,51200,0.2418151166703966
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,7168,10240,0.04089955488840739
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,7168,16384,0.08409777614805435
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,7168,8192,0.03442488776312934
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,7168,7168,0.030377778742048476
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,8192,6144,0.04141511188613044
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,7168,12288,0.06486577457851835
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,7168,6144,0.026550221774313185
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,7168,10240,0.056699554125467934
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,7168,5120,0.02257866660753886
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,7168,7168,0.04196711050139534
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,7168,3584,0.016910221841600206
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,7168,6144,0.03748355640305413
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,7168,5120,0.03293244375122918
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,7168,3072,0.015067555838161044
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,7168,4096,0.027659555276234944
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,7168,2560,0.013230221966902414
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,7168,3584,0.025757332642873127
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,7168,3072,0.02388266722361247
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,7168,1536,0.009647111097971598
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,7168,2560,0.022022222479184467
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,7168,1024,0.007603555917739868
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,7168,2048,0.019663110375404358
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,7168,768,0.006220444622966979
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,7168,1536,0.017549332645204332
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,7168,512,0.005208888815508948
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,7168,768,0.015127999915017022
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,7168,256,0.00490133340160052
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,7168,512,0.014152889450391134
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,7168,128,0.0042035554846127825
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,7168,256,0.01365066650840971
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,7168,64,0.003826666623353958
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,7168,128,0.01312711089849472
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,7168,32,0.003908444609906939
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,7168,64,0.013080000049538083
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,7168,8192,0.04656177759170532
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,7168,4096,0.019105777144432068
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,7168,32,0.013089777694808112
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,6144,65536,0.22067022323608398
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,6144,51200,0.1513813336690267
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,7168,2048,0.011520889070298938
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,6144,16384,0.052928000688552856
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,6144,12288,0.040896889236238264
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,6144,65536,0.3001946608225505
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,6144,51200,0.23070043987698027
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,6144,10240,0.03546222382121616
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,6144,12288,0.06386488676071167
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,6144,16384,0.0825857785012987
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,6144,7168,0.025395555628670588
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,6144,10240,0.055283556381861367
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,6144,6144,0.023219555616378784
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,6144,8192,0.04662933283381992
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,6144,5120,0.01993333299954732
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,6144,7168,0.040932443406846784
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,6144,4096,0.016136000553766888
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,6144,6144,0.036469333701663546
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,6144,3584,0.014653333359294467
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,6144,5120,0.032630221711264715
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,6144,3072,0.013571555415789286
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,6144,4096,0.02711822258101569
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,6144,3584,0.025249777568711176
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,6144,2560,0.011242667006121742
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,6144,2048,0.010008888940016428
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,6144,3072,0.023668444818920557
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,6144,1536,0.008832000195980072
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,6144,2560,0.021560000048743352
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,6144,1024,0.006969778074158563
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,6144,1536,0.017196445001496207
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,6144,768,0.0058408888677755995
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,6144,1024,0.015141333142916361
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,6144,512,0.004870222260554631
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,6144,768,0.014789332946141561
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,6144,8192,0.029321776496039495
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,6144,512,0.01391999920209249
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,7168,1024,0.015523556205961438
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,6144,256,0.013087111214796701
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,6144,64,0.003495111233658261
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,6144,32,0.0035439998739295532
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,7168,65536,0.23616978857252333
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,6144,128,0.012799999780125089
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,6144,64,0.012903110848532783
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,6144,32,0.013065777719020844
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,5120,65536,0.18841066625383165
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,5120,51200,0.1501306692759196
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,5120,16384,0.05067911081843906
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,5120,65536,0.26129065619574654
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,5120,12288,0.03977600071165297
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,5120,51200,0.20464000436994764
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,5120,16384,0.0728915532430013
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,5120,10240,0.033632887734307185
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,5120,8192,0.02846755584081014
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,5120,12288,0.05598666932847765
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,5120,7168,0.025179555018742878
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,5120,10240,0.0483511123392317
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,5120,6144,0.021993777818149988
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,5120,5120,0.018569777409235638
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,5120,8192,0.03983022107018365
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,5120,7168,0.03566311134232415
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,5120,4096,0.015475556254386902
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,5120,3584,0.013969777358902825
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,5120,6144,0.032637334532207914
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,6144,256,0.004184000194072723
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,5120,5120,0.029177778297000464
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,5120,3072,0.012688889271683164
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,5120,2560,0.011346666349305047
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,6144,128,0.0038542221817705366
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,5120,2048,0.009880888793203566
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,5120,3584,0.023232888844278123
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,5120,1536,0.008277333445019191
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,5120,3072,0.021606221795082092
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,5120,1024,0.006298666612969504
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,5120,768,0.005211555709441503
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,5120,2560,0.01998133295112186
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,5120,1536,0.01591822173860338
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,5120,512,0.004671999977694618
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,5120,1024,0.014686221877733866
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,5120,256,0.00388355553150177
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,5120,128,0.003489777859714296
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,5120,768,0.014447111222479077
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,5120,64,0.0035546666218174826
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,5120,512,0.013795555465751223
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,5120,256,0.013064888616402945
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,5120,128,0.012899555265903473
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,5120,32,0.0038373333712418876
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,5120,64,0.012379555238617791
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,5120,32,0.0124195557501581
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,4096,65536,0.1485475566652086
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,4096,51200,0.11942488617367214
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,4096,16384,0.03900977638032701
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,4096,12288,0.030284444491068523
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,6144,2048,0.019331556227472093
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,4096,10240,0.02595377796226078
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,4096,8192,0.021687999367713928
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,4096,65536,0.2539795504675971
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,4096,16384,0.07096978028615315
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,4096,7168,0.018623110320832994
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,4096,12288,0.05355822377734714
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,4096,10240,0.04664444592263964
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,4096,6144,0.01623288955953386
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,4096,5120,0.014434667097197639
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,4096,8192,0.038400888442993164
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,4096,7168,0.03490577803717719
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,4096,4096,0.0127697777416971
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,4096,6144,0.03166133496496413
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,4096,3584,0.011511999699804517
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,4096,3072,0.010383110907342698
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,5120,4096,0.02472977836926778
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,4096,4096,0.02438666588730282
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,4096,2560,0.009299555586444007
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,4096,3584,0.022817777262793645
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,4096,2048,0.007962666451931
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,4096,1536,0.006803555621041193
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,4096,3072,0.020870221985710993
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,4096,1024,0.005547555370463266
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,4096,2560,0.01902311046918233
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,4096,2048,0.01717333330048455
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,4096,768,0.00490488898422983
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,4096,1536,0.015799111790127225
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,4096,512,0.004547555413511065
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,4096,256,0.0038622220357259116
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,4096,768,0.014149333039919535
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,4096,512,0.013429332938459186
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,4096,128,0.0038364442686239877
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,4096,64,0.0034026667061779234
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,4096,128,0.01239111108912362
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,4096,32,0.0035235554807715942
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,4096,32,0.012068444656001197
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,4096,51200,0.1968595584233602
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,3584,65536,0.1271244419945611
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,4096,5120,0.02871111035346985
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,3584,51200,0.10280622376335992
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,3584,65536,0.21877333852979872
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,3584,16384,0.042591998974482216
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,5120,2048,0.01718311177359687
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,3584,12288,0.02932888931698269
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,3584,16384,0.06115200122197469
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,3584,10240,0.024479111035664875
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,3584,51200,0.1712284485499064
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,3584,8192,0.020522667302025687
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,4096,1024,0.01444355481200748
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,3584,7168,0.018567999203999836
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,3584,12288,0.04634311132960849
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,3584,6144,0.016233777006467182
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,3584,10240,0.04014666544066535
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,3584,5120,0.01427111029624939
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,3584,4096,0.012500444220172035
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,4096,256,0.013117333253224691
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,3584,7168,0.030974222554100886
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,3584,6144,0.028220444917678833
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,3584,3584,0.011376889215575324
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,3584,3072,0.01036888857682546
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,3584,5120,0.025826666090223525
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,3584,2560,0.009294222626421187
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,3584,4096,0.021987555755509272
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,4096,64,0.012694222231705984
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,3584,2048,0.009308444129096137
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,3584,3584,0.020560888780487906
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,3584,1536,0.007655111451943715
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,3584,1024,0.006228444476922353
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,3584,2560,0.017217778497272067
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,3584,768,0.00554666668176651
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,3584,2048,0.015808888607554965
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,3584,1536,0.01479022204875946
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,3584,256,0.0038568890757030914
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,3584,1024,0.013775111072593264
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,3584,128,0.0034968890249729156
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,3584,768,0.013585777746306526
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,3584,512,0.013064888616402945
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,3584,64,0.0032017777363459268
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,3584,256,0.012457778056462606
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,3584,32,0.0032293332947625052
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,3584,128,0.01239822225438224
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,3584,64,0.012064889073371887
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,3072,65536,0.111044446627299
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,3584,32,0.011752888560295105
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,3072,51200,0.08461422390407985
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,3072,16384,0.03354933195643955
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,3072,12288,0.02760266595416599
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,3072,65536,0.21488444010416666
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,3072,16384,0.059919999705420605
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,3072,10240,0.024540444215138752
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,3072,51200,0.16484533415900335
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,3072,8192,0.020603555772039626
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,3072,7168,0.01716800034046173
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,3584,8192,0.033766223324669734
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,3072,12288,0.046353777249654136
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,3072,6144,0.016182222300105624
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,3072,5120,0.013722666435771518
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,3072,10240,0.03968000080850389
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,3072,8192,0.033492445945739746
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,3072,4096,0.012030222349696688
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,3072,7168,0.03075288732846578
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,3072,3584,0.010990222295125326
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,3072,6144,0.028276443481445312
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,3072,3072,0.009988444546858469
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,3072,5120,0.025631111529138353
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,3072,2560,0.009308444129096137
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,3072,2048,0.008260444634490544
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,3072,4096,0.02123111155298021
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,3584,3072,0.018793778287039865
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,3072,3072,0.0188711103465822
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,3072,1024,0.005255110975768831
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,3072,2560,0.01716977854569753
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,3072,2048,0.015803555647532146
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,3584,512,0.0045422220395671
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,3072,1536,0.014647111296653748
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,3072,512,0.0038897775941424896
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,3072,1024,0.013798221945762634
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,3072,256,0.00350577798154619
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,3072,768,0.013439999686347114
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,3072,128,0.0035004446076022256
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,3072,512,0.01311822235584259
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,3072,64,0.0032195556494924757
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,3072,32,0.003195555466744635
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,3072,256,0.012494222157531314
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,3072,128,0.012070222033394707
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,3072,64,0.012094222009181976
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,2560,65536,0.0914720031950209
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,3072,32,0.012401777837011548
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,2560,51200,0.07442133294211493
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,2560,65536,0.21011911498175728
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,2560,51200,0.1622462272644043
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,2560,12288,0.025992888543340895
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,2560,16384,0.05755111243989733
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,2560,10240,0.021135111649831135
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,2560,8192,0.0177839994430542
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,2560,12288,0.04452355702718099
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,2560,10240,0.038986666334999934
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,2560,7168,0.016136000553766888
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,2560,8192,0.032877332634396024
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,2560,6144,0.014475555883513557
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,3072,3584,0.019894222418467205
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,2560,5120,0.01277511070171992
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,2560,4096,0.010671999719407825
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,3072,768,0.00461422238085005
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,2560,6144,0.0281368891398112
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,2560,3584,0.009678222239017487
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,2560,5120,0.024715556038750544
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,2560,3072,0.009124444590674506
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,2560,4096,0.020920000142521326
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,2560,2560,0.00850577818022834
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,2560,2048,0.00721777809990777
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,2560,3584,0.019271110494931538
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,2560,3072,0.017862222260899015
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,2560,1536,0.005943111247486538
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,2560,2560,0.016895999511082966
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,2560,1024,0.005223999834722943
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,2560,768,0.004586666822433472
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,2560,2048,0.015844444433848064
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,2560,512,0.004208000169859992
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,2560,1536,0.014444443914625378
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,2560,1024,0.013460444079505073
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,2560,256,0.003504000190231535
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,2560,16384,0.03137600090768602
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,2560,128,0.003519111209445529
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,2560,64,0.0032044444233179092
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,2560,512,0.013157332936922709
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,2560,256,0.012434666355450949
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,2560,32,0.0033200000309281876
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,2560,128,0.012119111087587146
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,2560,64,0.011760888828171624
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,2048,65536,0.07626044750213623
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,2560,32,0.011696000066068439
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,2048,51200,0.05951288673612806
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,2048,16384,0.02476177778508928
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,2048,12288,0.02086044516828325
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,2048,65536,0.2073191139433119
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,2048,51200,0.15960444344414607
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,3072,1536,0.006624889042642381
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,2048,16384,0.05589955382876926
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,2048,10240,0.02166044380929735
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,2560,7168,0.030220445659425523
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,2048,12288,0.04349955585267809
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,2048,7168,0.016383111476898193
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,2048,6144,0.014827556080288358
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,2048,10240,0.03836977812978957
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,2048,5120,0.013044444223244986
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,2048,7168,0.029959999852710303
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,2048,4096,0.0111191107167138
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,2048,6144,0.02745955520206028
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,2048,3584,0.009160888691743216
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,2048,3072,0.00792622235086229
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,2048,5120,0.02409511142306858
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,2048,4096,0.019874667127927143
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,2048,2560,0.0069288888739215
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,2048,3584,0.019260444574885897
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,2048,2048,0.006132444573773279
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,2048,3072,0.017872000734011333
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,2048,1536,0.0052435555391841466
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,2048,1024,0.004553777890072929
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,2048,2560,0.016812443733215332
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,2048,2048,0.015684444043371413
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,2048,768,0.004190222256713443
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,2048,1536,0.01443733274936676
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,2048,512,0.003543111185232798
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,2048,1024,0.013779555757840475
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,2048,256,0.0034719999465677473
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,2048,128,0.0032035555276605818
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,2048,768,0.013529777526855469
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,2048,64,0.0031519999934567344
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,2048,256,0.012456888953844706
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,2048,128,0.01202666676706738
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,2048,32,0.0028497777465316984
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,2048,64,0.01204711116022534
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,1536,65536,0.059752000702752
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,2048,32,0.01145244472556644
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,1536,51200,0.04875555634498596
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,2048,8192,0.01817244456874
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,1536,65536,0.1672017839219835
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,1536,16384,0.020245333512624104
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,1536,12288,0.016880000631014507
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,2048,8192,0.03235466612709893
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,1536,10240,0.01776000029510922
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,1536,51200,0.12855554951561823
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,1536,16384,0.0450853341155582
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,1536,8192,0.015471999843915304
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,1536,12288,0.035635554128222995
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,1536,7168,0.013393777940008374
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,1536,6144,0.012348444097571902
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,1536,10240,0.032171554035610624
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,1536,5120,0.011807111402352652
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,1536,8192,0.027494221925735474
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,1536,4096,0.009988444546858469
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,1536,7168,0.025408888856569927
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,1536,3584,0.008371555142932469
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,1536,6144,0.022346667117542688
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,1536,3072,0.007855999800893996
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,1536,2560,0.006962666908899943
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,1536,4096,0.01772533357143402
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,2560,768,0.013409777647919126
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,1536,3584,0.017179555363125272
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,1536,2048,0.006259555617968242
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,1536,1536,0.0052328887912962176
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,1536,3072,0.015857777661747403
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,1536,1024,0.004561777744028303
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,1536,2560,0.015404444601800708
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,1536,768,0.004247111164861255
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,1536,2048,0.014283556077215405
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,1536,512,0.003567111161020067
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,1536,1536,0.013451555536852943
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,1536,256,0.0032462223122517266
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,2048,512,0.012785777449607849
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,1536,1024,0.012736000120639801
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,1536,128,0.0032044444233179092
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,1536,768,0.013075555364290873
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,1536,64,0.0028364445186323593
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,1536,32,0.002862222285734283
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,1536,512,0.012409778104888068
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,1536,256,0.012089778151777057
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,1024,65536,0.043599999613232084
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,1536,64,0.011800888511869641
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,1536,32,0.011415999796655444
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,1024,51200,0.035466667678621076
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,1024,16384,0.016210666961140104
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,1024,12288,0.014132445057233175
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,1024,10240,0.013960000541475085
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,1024,65536,0.16468800438774958
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,1024,16384,0.043288889858457774
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,1024,51200,0.1259982188542684
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,1024,8192,0.012390221986505719
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,1024,7168,0.012478222449620565
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,1024,6144,0.011047110789351992
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,1024,10240,0.031176888280444678
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,1024,5120,0.009631111390060848
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,1024,8192,0.02642755541536543
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,1024,7168,0.024513777759340074
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,1024,4096,0.008096888661384583
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,1024,6144,0.02204799983236525
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,1024,5120,0.020132443971104093
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,1024,3072,0.0069191112286514705
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,1024,4096,0.01756355497572157
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,1536,5120,0.020582222276263766
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,1024,2560,0.006259555617968242
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,1024,2048,0.005561777700980504
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,1024,3072,0.015855110353893705
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,1024,1536,0.00490399988161193
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,1024,2560,0.014910222755538093
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,1024,2048,0.014096000128322177
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,1024,1024,0.004197333421972063
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,1024,768,0.0038382220599386427
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,1024,1536,0.01344622257683012
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,1024,512,0.0034924443397257063
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,1024,1024,0.012747555143303342
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,1024,256,0.003160888950030009
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,1536,128,0.011748444702890186
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,1024,128,0.003173333282272021
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,1024,512,0.012430222498046027
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,1024,64,0.0028453332682450614
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,1024,256,0.012025777664449481
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,1024,32,0.0028213332924577924
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,1024,128,0.011701333026091257
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,768,65536,0.034576889541414045
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,1024,12288,0.035516444179746844
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,1024,32,0.011424889167149862
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,768,51200,0.02810844447877672
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,768,16384,0.01443555619981554
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,1024,3584,0.007657777931955125
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,768,65536,0.16304977734883627
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,768,51200,0.12463200092315674
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,768,12288,0.012877333495352002
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,768,16384,0.04344800114631653
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,768,10240,0.011373333632946014
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,768,8192,0.010647999743620554
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,1024,3584,0.01682044400109185
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,768,7168,0.012698666916953193
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,768,12288,0.03502577874395583
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,768,6144,0.010746666954623329
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,768,10240,0.030543999539481267
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,768,8192,0.026168000366952684
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,768,5120,0.009333333207501305
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,768,4096,0.007993777592976889
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,768,7168,0.023888889286253188
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,768,3584,0.007328888608349695
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,768,6144,0.021903110875023737
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,768,3072,0.006634666687912411
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,768,4096,0.01735911104414198
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,768,2560,0.006219555520349079
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,1024,768,0.0127688886390792
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,768,3072,0.01581333412064446
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,768,2048,0.005264889034960005
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,768,1536,0.005056888692908817
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,768,2560,0.014944000376595391
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,768,1024,0.0041848888827694785
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,768,2048,0.013878222141000958
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,768,768,0.0038648889296584656
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,1024,64,0.011366222467687396
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,768,512,0.0034835553831524322
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,768,1024,0.012749333348539142
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,768,768,0.012725333372751871
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,768,512,0.012364444633324942
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,768,128,0.002814222127199173
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,768,256,0.01181244436237547
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,768,64,0.0028231110837724474
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,768,128,0.011681777735551199
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,768,32,0.00286666676402092
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,768,64,0.011483555866612328
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,512,65536,0.02604177759753333
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,768,32,0.011175110936164856
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,512,51200,0.022996443841192458
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,768,5120,0.020262221495310467
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,512,16384,0.014478221535682678
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,768,3584,0.016979555288950603
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,512,65536,0.16242133246527776
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,512,12288,0.013762666947311826
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,512,10240,0.012387555506494312
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,512,51200,0.12319910526275635
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,512,8192,0.011017777853541903
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,512,7168,0.010047111246320937
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,512,10240,0.03020355436537001
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,512,12288,0.03392622205946181
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,768,1536,0.013407111167907715
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,512,6144,0.009345778160625035
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,512,5120,0.009215110705958473
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,512,7168,0.023710222707854375
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,512,4096,0.007656888829337225
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,512,3584,0.007248889240953658
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,768,256,0.0031679999083280563
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,512,5120,0.020084444019529555
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,512,3072,0.006614222294754452
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,512,4096,0.01753155555990007
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,512,3584,0.016837333639462788
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,512,2048,0.005208888815508948
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,512,2560,0.01478488908873664
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,512,1536,0.004874666531880696
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,512,2048,0.013891556196742587
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,512,1024,0.00388711111413108
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,512,1536,0.013426666458447775
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,512,768,0.0038488888078265717
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,512,1024,0.01273155543539259
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,512,512,0.0035422220826148987
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,512,768,0.01275111072593265
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,512,256,0.0031617778456873367
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,512,512,0.012101333174440594
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,512,16384,0.04258666767014397
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,512,128,0.002817777709828483
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,512,64,0.0025128889828920364
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,512,256,0.011779555843936073
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,512,32,0.0026480000880029467
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,512,8192,0.025382222400771245
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,512,128,0.011404444773991903
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,256,65536,0.02357599967055851
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,512,64,0.011411555939250521
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,256,51200,0.02008888953261905
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,512,6144,0.021993777818149988
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,256,16384,0.011043555206722684
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,512,32,0.011257777611414591
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,256,12288,0.010335110955768162
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,512,2560,0.005896889087226655
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,256,10240,0.009686222506894005
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,256,65536,0.15900088681115046
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,256,8192,0.010127999716334874
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,512,3072,0.015855999456511605
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,256,16384,0.041514668199751116
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,256,12288,0.03310044606526693
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,256,6144,0.0090515555606948
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,256,10240,0.029398222764333088
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,256,8192,0.025370667378107708
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,256,5120,0.008954666554927826
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,256,4096,0.007616000043021307
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,256,6144,0.021664000219768945
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,256,3584,0.007269333634111617
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,256,3072,0.00658044425977601
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,256,5120,0.019714666737450492
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,256,2560,0.0059057776298787855
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,256,3584,0.016513778103722464
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,256,3072,0.015828443898095023
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,256,2048,0.005232000102599462
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,256,2560,0.014818666709793938
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,256,1536,0.004531555705600315
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,256,2048,0.013763555222087435
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,256,1024,0.0038986665507157645
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,256,1536,0.013184000220563678
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,256,768,0.0038559999730851916
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,256,1024,0.012697777814335294
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,256,512,0.0032239999208185407
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,256,768,0.012429333395428128
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,256,256,0.003177777760558658
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,256,512,0.012044444680213928
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,256,51200,0.12134222189585368
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,256,128,0.0028124445428450904
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,256,7168,0.009722666607962714
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,256,64,0.0028106667515304354
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,256,32,0.0028026666906144884
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,256,128,0.011376000112957425
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,256,64,0.011363555159833698
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,128,65536,0.01608000033431583
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,256,32,0.011357333097192975
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,128,51200,0.014075555735164218
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,256,4096,0.017536888519922893
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,128,16384,0.00999022192425198
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,128,12288,0.012131555212868584
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,128,10240,0.011109333071443768
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,128,51200,0.12133777141571045
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,128,16384,0.04054222173160977
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,128,12288,0.0328764451874627
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,128,8192,0.009988444546858469
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,128,7168,0.009352888498041365
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,128,10240,0.029566221767001685
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,128,6144,0.008640000389681922
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,128,5120,0.008039111064540016
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,128,8192,0.02529511186811659
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,128,7168,0.023369777533743117
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,128,4096,0.007605333295133378
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,128,6144,0.021648888786633808
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,128,3584,0.006909333169460297
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,128,5120,0.019609777463806998
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,128,3072,0.006268444574541516
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,128,4096,0.017232000827789307
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,128,2560,0.005586666779385672
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,128,2048,0.004911111046870549
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,128,3584,0.01686755485004849
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,128,1536,0.004613333278232151
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,128,2560,0.014833778142929077
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,128,1024,0.00396799999806616
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,128,2048,0.013797333670987023
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,128,768,0.003499555504984326
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,256,256,0.011716444459226398
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,128,512,0.0031679999083280563
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,128,1024,0.012442666623327466
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,256,7168,0.02350933353106181
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,128,256,0.00314666661951277
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,128,768,0.012481778032249875
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,128,128,0.0028355556229750314
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,128,64,0.0028400001012616684
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,128,256,0.011752000285519494
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,128,128,0.011391110718250275
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,128,32,0.002529777793420686
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,128,65536,0.160407993528578
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,64,65536,0.01478666729397244
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,64,51200,0.02235288918018341
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,128,32,0.011400889191362592
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,64,16384,0.00941244430012173
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,64,65536,0.16005333264668783
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,64,51200,0.12127555741204156
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,64,16384,0.04038666685422262
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,64,10240,0.009022222624884712
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,64,12288,0.03292977809906006
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,64,8192,0.008302222523424361
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,128,3072,0.015466666883892484
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,64,7168,0.009019555317031013
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,64,8192,0.02537600033813053
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,128,1536,0.013456888496875763
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,64,6144,0.008637333081828224
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,64,5120,0.007664889097213745
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,64,7168,0.02344177828894721
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,64,4096,0.007387555307812161
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,64,6144,0.02164799968401591
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,128,512,0.012084444363911947
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,64,3584,0.0069644442862934535
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,64,5120,0.019895111521085102
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,64,3072,0.006276444428496891
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,64,4096,0.016951110627916124
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,64,2560,0.005584888988071018
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,128,64,0.011382222175598145
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,64,3584,0.01627377834584978
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,64,1536,0.0042364444169733255
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,64,3072,0.015807999504937064
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,64,1024,0.0038417776425679526
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,64,2048,0.013760888742076026
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,64,768,0.003552888830502828
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,64,1536,0.012784889174832238
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,64,512,0.0031591111587153543
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,64,1024,0.01274400038851632
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,64,12288,0.009681777821646797
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,64,768,0.01240711079703437
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,64,512,0.012075555821259817
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,64,128,0.0028479999552170434
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,64,256,0.011697777443461947
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,64,64,0.002532444480392668
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,64,10240,0.029398222764333088
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,64,32,0.002798222212327851
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,64,64,0.011361777782440186
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,32,65536,0.01648888819747501
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,64,32,0.011360888679822287
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,32,51200,0.023967110448413428
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,32,65536,0.15888978375328913
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,32,16384,0.015513777732849121
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,32,51200,0.11961155467563206
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,32,12288,0.01313244468635983
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,32,10240,0.012063110868136087
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,64,2560,0.014544889330863953
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,32,16384,0.03983733389112685
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,32,8192,0.00833155545923445
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,32,12288,0.03271111183696323
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,32,7168,0.00867733359336853
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,32,6144,0.008626666333940294
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,32,10240,0.029469334416919287
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,32,8192,0.025009777810838487
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,64,256,0.0028204443968004654
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,32,5120,0.007629333270920648
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,32,7168,0.02335022224320306
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,32,4096,0.007592889169851939
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,32,3584,0.006612444503439798
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,32,6144,0.02132355504565769
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,32,3072,0.006215999937719769
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,32,2560,0.005594666633341048
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,32,4096,0.017234666479958426
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,32,3584,0.016538666354285348
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,32,2048,0.004881777697139316
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,32,1536,0.004523555437723796
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,32,3072,0.015446222490734525
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,64,128,0.011352000137170156
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,32,2560,0.014838222000333997
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,32,768,0.0036231109665499795
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,32,2048,0.013930666777822705
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,32,512,0.003176888864901331
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,32,1024,0.012387555506494312
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,32,768,0.012601777911186218
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,32,512,0.012109333442317115
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,32,128,0.0025315555847353404
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,32,256,0.011703111231327057
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,32,64,0.002536888958679305
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,64,2048,0.0052355556852287715
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,32,128,0.011717333561844297
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,32,32,0.0025333333760499954
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,32,64,0.011391999820868174
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,32,32,0.011552888486120435
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,32,5120,0.01958044370015462
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,32,1024,0.0038933331767717996
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,257,32,1536,0.01310400002532535
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,257,32,256,0.002995555599530538
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,65536,16384,0.49371200137668186
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,65536,16384,0.37642667028639054
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,65536,51200,1.1673591401841905
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,65536,12288,0.37881512112087673
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,65536,12288,0.28280888663397896
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,65536,10240,0.2482924461364746
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,65536,51200,1.5273884667290583
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,65536,8192,0.2015519936879476
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,65536,10240,0.23733777470058867
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,65536,7168,0.1676959991455078
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,65536,8192,0.1793688933054606
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,65536,10240,0.22156977653503418
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,65536,12288,0.26178844769795734
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,65536,16384,0.3447599940829807
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,65536,6144,0.15951555305057102
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,65536,5120,0.13343466652764216
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,65536,8192,0.19304711288876006
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,65536,7168,0.16052444775899252
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,65536,4096,0.10770844750934178
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,65536,4096,0.10222222407658894
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,65536,5120,0.12432000372144912
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,65536,3584,0.09396355681949192
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,65536,6144,0.13983644379509821
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,65536,3072,0.08886044555240208
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,65536,3584,0.09023555782106187
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,65536,4096,0.10152800215615167
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,65536,5120,0.12213244703080918
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,65536,3072,0.07959200276268853
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,65536,2560,0.06815377871195476
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,65536,3584,0.09275466865963405
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,65536,2048,0.05639555719163683
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,65536,2560,0.0706640018357171
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,65536,3072,0.0839573343594869
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,65536,1536,0.04528622163666619
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,65536,6144,0.14773421817355686
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,65536,7168,0.17818755573696562
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,65536,1024,0.034126222133636475
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,65536,2560,0.07566933499442206
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,65536,1536,0.04953155583805508
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,65536,768,0.02642755541536543
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,65536,2048,0.06640444199244182
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,65536,1536,0.058027558856540255
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,65536,512,0.01969688965214623
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,65536,1024,0.049992889165878296
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,65536,1024,0.04035822219318814
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,65536,768,0.045718222856521606
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,65536,256,0.012837332983811697
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,65536,512,0.029263112280103896
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,65536,512,0.04110222061475118
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,65536,256,0.03665155503484938
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,65536,256,0.025790222816997107
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,65536,64,0.009307555854320526
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,65536,128,0.02518400053183238
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,65536,128,0.03049955434269375
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,65536,32,0.00977422214216656
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,65536,64,0.024382222029897902
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,65536,32,0.02399377855989668
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,65536,2048,0.06032622522777981
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,65536,768,0.03437066740459866
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,65536,128,0.011701333026091257
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,51200,65536,1.1782737308078342
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,51200,65536,1.3372507095336914
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,65536,51200,1.114023102654351
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,51200,51200,1.0401582717895508
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,51200,16384,0.33394577768113876
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,51200,51200,0.9252266354031033
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,51200,16384,0.31095200114780003
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,51200,12288,0.25785777303907603
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,51200,12288,0.2322453392876519
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,51200,10240,0.17517244815826416
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,51200,8192,0.1468835539287991
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,51200,10240,0.19355555375417074
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,51200,8192,0.15695022212134466
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,51200,7168,0.12663022677103677
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,51200,12288,0.21982133388519287
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,51200,10240,0.18608444266849092
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,51200,7168,0.13713778389824763
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,51200,16384,0.28693511750963
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,51200,8192,0.15378310945298937
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,51200,6144,0.12512355380588108
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,51200,5120,0.09386844767464532
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,51200,6144,0.12048444483015273
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,51200,4096,0.08700266811582778
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,51200,5120,0.10196089082294041
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,51200,4096,0.08394933409161037
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,51200,7168,0.1376311116748386
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,51200,3584,0.0765591131316291
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,51200,6144,0.12531288464864096
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,51200,3072,0.060138669278886586
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,51200,5120,0.10703021950191921
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,51200,4096,0.09009955326716106
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,51200,3584,0.07440000110202365
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,51200,2560,0.051719112528694995
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,51200,3072,0.06566666894488864
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,51200,2560,0.05864444706175062
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,51200,3072,0.0754657785097758
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,51200,2560,0.06767111354404025
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,51200,1536,0.03250311149491204
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,51200,2048,0.05072355601522657
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,51200,2048,0.06108178032769097
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,51200,1024,0.025754666990704004
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,51200,1536,0.04200889004601372
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,51200,1536,0.05316266748640272
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,51200,1024,0.03465422325664096
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,51200,1024,0.04578666554556953
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,51200,512,0.014853333433469137
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,51200,768,0.028931554820802476
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,51200,768,0.041951109965642296
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,51200,256,0.011738667057620155
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,51200,512,0.02494311167134179
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,51200,512,0.03791911072201199
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,51200,128,0.009639999932712978
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,51200,256,0.02305511136849721
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,51200,128,0.02178222272131178
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,51200,64,0.008612444831265343
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,51200,128,0.02741688821050856
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,51200,3584,0.08261155419879489
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,51200,64,0.02159999973244137
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,51200,32,0.021280889709790547
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,51200,51200,0.9049670961168078
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,51200,768,0.01960088809331258
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,16384,65536,0.3929911189609104
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,16384,65536,0.4700595537821452
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,16384,51200,0.30743111504448783
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,51200,65536,1.144394662645128
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,16384,16384,0.10389955838521321
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,51200,256,0.034105777740478516
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,16384,12288,0.07897955841488309
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,16384,51200,0.3660675684611003
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,51200,2048,0.04337333308325874
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,16384,10240,0.06829955842759874
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,16384,12288,0.09322666459613377
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,16384,16384,0.13112444347805446
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,16384,8192,0.05685244666205513
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,16384,10240,0.08022577895058526
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,16384,12288,0.10617955525716145
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,16384,16384,0.1335031059053209
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,16384,8192,0.0702915522787306
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,16384,7168,0.04877688818507724
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,16384,10240,0.09331111113230388
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,16384,6144,0.042279998461405434
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,16384,8192,0.07948355542288886
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,16384,5120,0.037618666887283325
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,16384,7168,0.07391022311316596
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,16384,6144,0.052616887622409396
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,16384,6144,0.06707821951972114
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,16384,4096,0.030435555511050757
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,16384,5120,0.047298666503694325
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,16384,5120,0.06020355224609375
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,16384,3584,0.027776888675159876
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,51200,32,0.009687110781669617
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,16384,4096,0.0525857773092058
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,16384,51200,0.3800684346093072
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,16384,3072,0.02482844392458598
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,16384,3584,0.03525155451562669
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,16384,3584,0.04977688855595059
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,16384,2560,0.020575111111005146
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,16384,3072,0.03206933206982083
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,16384,65536,0.48884979883829754
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,16384,2048,0.017251556118329365
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,16384,2560,0.042423999971813627
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,16384,1536,0.014087110757827759
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,16384,2048,0.02517066730393304
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,16384,2048,0.0391226675775316
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,16384,1024,0.011167111496130625
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,16384,7168,0.05957421991560194
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,16384,1536,0.022097777989175584
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,16384,1536,0.03559022148450216
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,16384,768,0.009743111001120673
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,16384,1024,0.019425777925385367
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,16384,512,0.008310221963458592
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,16384,768,0.017674666312005784
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,16384,768,0.030798223283555772
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,16384,1024,0.031452443864610456
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,16384,256,0.00555644432703654
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,16384,512,0.01610488858487871
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,16384,512,0.02747111188040839
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,16384,128,0.005208888815508948
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,16384,256,0.026081777281231348
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,16384,256,0.015122666954994202
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,16384,64,0.004580444345871608
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,16384,32,0.004912000149488449
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,16384,4096,0.03832355472776625
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,16384,128,0.014667555689811707
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,16384,64,0.014507555299335055
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,16384,32,0.01480888823668162
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,16384,3072,0.04546844296985202
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,12288,65536,0.2970808876885308
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,16384,2560,0.028119110398822363
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,12288,51200,0.23430310355292427
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,12288,65536,0.3972880045572917
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,12288,16384,0.08393688996632893
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,12288,12288,0.06123822265201145
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,12288,51200,0.30645865864223903
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,12288,16384,0.10685511430104573
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,12288,10240,0.05242400036917793
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,12288,12288,0.08213422033521864
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,12288,10240,0.07081155644522773
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,12288,16384,0.1312266720665826
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,12288,12288,0.10516177945666844
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,12288,8192,0.043848888741599194
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,16384,128,0.021665778425004747
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,12288,7168,0.0377422206931644
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,12288,8192,0.05893955628077189
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,12288,10240,0.09224977758195664
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,12288,6144,0.033181332879596286
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,12288,8192,0.07816000117195977
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,12288,7168,0.05194933215777079
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,12288,5120,0.029037333197063867
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,12288,7168,0.07208444674809773
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,12288,6144,0.048285331990983754
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,12288,4096,0.02481866710715824
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,12288,3584,0.021887999441888597
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,12288,5120,0.04138755467202928
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,12288,5120,0.05912444326612684
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,12288,4096,0.05161688725153605
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,12288,3072,0.01924444403913286
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,12288,3584,0.03087555699878269
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,12288,51200,0.36926934454176163
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,12288,2560,0.01645511057641771
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,12288,65536,0.47260353300306535
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,12288,3072,0.028393778536054824
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,12288,3072,0.04422666629155477
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,12288,2048,0.013962666193644205
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,12288,1536,0.010998222563001843
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,12288,2560,0.025422222084469263
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,12288,2560,0.041167110204696655
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,12288,1024,0.009870222045315636
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,12288,2048,0.022648889157507155
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,12288,2048,0.03848888807826572
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,12288,1536,0.035601778162850276
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,12288,1536,0.020242666204770405
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,12288,768,0.00835111074977451
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,12288,1024,0.03137866655985514
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,12288,1024,0.01754399968518151
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,12288,768,0.029476443926493328
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,12288,256,0.0052133335007561584
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,12288,512,0.025711110896534387
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,12288,512,0.015154666370815702
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,12288,768,0.01648177703221639
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,12288,128,0.004856889032655292
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,12288,256,0.025349333882331848
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,12288,256,0.014155555102560254
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,12288,64,0.00452977791428566
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,12288,128,0.02163911031352149
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,12288,32,0.004517333375083076
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,12288,6144,0.06617066595289442
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,12288,64,0.013795555465751223
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,12288,4096,0.03432000014517043
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,12288,3584,0.048272000418768994
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,10240,65536,0.22688354386223686
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,10240,51200,0.1897519959343804
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,10240,65536,0.3531493345896403
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,10240,16384,0.06131466892030504
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,12288,512,0.006883555402358373
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,10240,51200,0.2722382280561659
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,10240,12288,0.04918577935960558
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,10240,16384,0.09570133023791844
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,10240,12288,0.07373155487908258
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,12288,128,0.014088888963063559
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,10240,16384,0.13012533717685276
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,10240,10240,0.04064088728692796
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,10240,12288,0.10433599683973525
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,10240,8192,0.0351875556839837
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,10240,10240,0.06408088737063937
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,12288,32,0.01344622257683012
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,10240,7168,0.032595554987589516
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,10240,8192,0.052842666705449425
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,10240,10240,0.09124444590674506
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,10240,6144,0.027748444014125403
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,10240,8192,0.07768978012932672
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,10240,5120,0.023223110371165808
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,10240,7168,0.07157155540254381
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,10240,6144,0.04359644320276049
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,10240,65536,0.4692595799763997
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,10240,51200,0.36591378847757977
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,10240,4096,0.02019466625319587
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,10240,6144,0.06506755616929796
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,10240,3584,0.017143999536832173
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,10240,5120,0.037808888488345675
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,10240,3072,0.015441776977645027
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,10240,3584,0.028088887532552082
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,10240,4096,0.03077510992685954
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,10240,3584,0.046979556481043495
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,10240,2560,0.013071111506885953
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,10240,3072,0.02609066665172577
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,10240,3072,0.04379466507169935
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,10240,2048,0.011518222590287527
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,10240,2560,0.040983110666275024
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,10240,1536,0.009873777627944946
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,10240,2048,0.03798222210672166
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,10240,2048,0.02131555477778117
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,10240,1024,0.008287111090289222
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,10240,1536,0.01921422282854716
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,10240,1536,0.03444088829888238
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,10240,768,0.006622222148709827
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,10240,1024,0.029130667448043823
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,10240,1024,0.016559999850061204
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,10240,512,0.005277333160241445
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,10240,768,0.015624889069133334
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,10240,768,0.02844266759024726
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,10240,7168,0.046145776907602944
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,10240,256,0.004521777646409141
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,10240,512,0.014440000057220459
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,10240,128,0.003903999924659729
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,10240,512,0.026039999392297532
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,10240,256,0.025719111164410908
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,10240,256,0.013749333719412485
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,10240,64,0.003909333298603694
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,10240,128,0.021719111336602107
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,10240,32,0.003919110943873723
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,10240,5120,0.059041778246561684
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,10240,64,0.01334755536582735
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,10240,4096,0.050844444168938525
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,10240,32,0.013096888860066732
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,8192,65536,0.20453333854675293
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,8192,51200,0.15896356105804443
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,10240,2560,0.023665777511066858
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,8192,16384,0.05540711018774244
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,8192,65536,0.30626577801174587
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,8192,51200,0.23584887716505262
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,8192,16384,0.08467466963662042
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,8192,12288,0.06536977820926242
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,8192,10240,0.036680890454186335
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,8192,12288,0.0810862249798245
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,8192,10240,0.05699555741416084
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,8192,8192,0.030866665972603693
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,8192,10240,0.07148533397250705
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,10240,128,0.013144888811641268
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,8192,51200,0.2590586609310574
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,8192,7168,0.027659555276234944
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,8192,65536,0.3289955457051595
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,8192,8192,0.046952890025244824
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,8192,6144,0.02404088940885332
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,8192,8192,0.06031822495990329
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,8192,7168,0.04270311196645101
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,8192,5120,0.020671111014154222
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,8192,7168,0.05645333396063911
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,8192,4096,0.01770666738351186
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,8192,6144,0.037971556186676025
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,8192,3584,0.015198222464985318
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,8192,5120,0.03269955515861511
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,8192,5120,0.04783644609981113
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,8192,4096,0.027446221974160936
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,8192,4096,0.041950222518708974
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,8192,12288,0.04316533274120755
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,8192,3072,0.013785777820481194
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,8192,3584,0.03946400019857619
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,8192,3584,0.025647999511824712
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,8192,2560,0.01219288922018475
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,8192,2048,0.010824888944625854
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,8192,3072,0.02386933399571313
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,8192,3072,0.036665777365366616
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,8192,2560,0.03480266531308492
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,8192,1536,0.008960000342792934
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,8192,2048,0.01983022193113963
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,8192,16384,0.09965066777335273
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,8192,2048,0.03287200133005778
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,8192,1024,0.0070879997478591064
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,8192,768,0.005595555735958948
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,8192,1536,0.01754844519827101
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,8192,1024,0.025974222355418738
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,8192,1024,0.015728889240158927
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,8192,512,0.004876444323195351
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,8192,768,0.014531556102964612
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,8192,256,0.0041928887367248535
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,8192,512,0.024127999941507976
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,8192,512,0.014113777213626437
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,8192,128,0.0038906666967603895
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,8192,256,0.013254221942689685
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,8192,256,0.023774221539497375
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,8192,64,0.0038337777886125776
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,8192,128,0.013258666627936892
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,8192,128,0.020619556307792664
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,8192,32,0.003882666842805015
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,8192,6144,0.051981333229276866
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,8192,64,0.01274222218328052
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,8192,32,0.012597333225939008
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,7168,65536,0.18076533741421172
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,7168,51200,0.14089066452450222
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,7168,65536,0.3022773265838623
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,8192,2560,0.021949332621362474
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,7168,16384,0.04897955391142103
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,7168,51200,0.23288978470696342
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,8192,1536,0.03108533223470052
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,7168,16384,0.08315110868877836
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,7168,12288,0.04071022073427836
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,7168,10240,0.03330933385425144
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,8192,768,0.025968889395395916
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,7168,16384,0.09796533319685195
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,7168,12288,0.064246224032508
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,7168,8192,0.0281315545241038
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,7168,12288,0.08011555671691895
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,7168,10240,0.056383113066355385
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,7168,7168,0.025119110941886902
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,7168,10240,0.0703351100285848
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,7168,8192,0.045943111181259155
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,7168,6144,0.021464889248212177
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,7168,8192,0.05970488654242622
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,7168,65536,0.32469601101345485
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,7168,7168,0.04138044516245524
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,7168,5120,0.018515555395020377
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,7168,7168,0.05583822064929538
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,7168,6144,0.0370782216389974
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,7168,4096,0.015838222371207345
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,7168,51200,0.2553013430701362
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,7168,6144,0.05176088876194424
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,7168,3584,0.014112000664075216
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,7168,3072,0.012753778033786349
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,7168,5120,0.047563556167814464
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,7168,5120,0.03276977936426798
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,7168,4096,0.041464000940322876
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,7168,4096,0.027087999714745417
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,7168,2560,0.011295110815101199
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,7168,3584,0.039628442790773176
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,7168,3584,0.025272889269722834
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,7168,2048,0.00998222248421775
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,7168,3072,0.023523555861579046
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,7168,3072,0.03698577814631992
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,7168,2560,0.03465777635574341
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,7168,2560,0.02181600034236908
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,7168,2048,0.032764444748560585
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,7168,2048,0.019489778412712943
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,7168,1536,0.03090488910675049
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,7168,768,0.005893333504597346
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,7168,1536,0.016922665966881644
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,7168,512,0.004910222358173794
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,7168,1024,0.015448000695970325
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,7168,768,0.025756445195939805
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,7168,768,0.014553777045673795
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,7168,256,0.00453955555955569
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,7168,512,0.013787555197874704
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,7168,512,0.025010666913456384
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,7168,128,0.003882666842805015
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,7168,256,0.023640000157886084
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,7168,64,0.0035626664757728577
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,7168,128,0.013110222087966071
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,7168,128,0.020571556356218126
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,7168,32,0.003896000070704354
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,7168,64,0.01277599980433782
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,7168,32,0.013343999783198038
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,6144,65536,0.16830133067237008
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,6144,51200,0.12979022661844888
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,6144,65536,0.2635626792907715
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,7168,1536,0.008571555217107138
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,7168,1024,0.006618666566080517
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,6144,16384,0.048435555564032666
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,6144,51200,0.20346666706932914
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,7168,1024,0.02568622264597151
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,6144,12288,0.03546133306291368
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,6144,16384,0.07339288791020711
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,7168,256,0.013450666434235044
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,6144,65536,0.31961245006985134
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,6144,12288,0.057201776239607066
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,6144,10240,0.031333333916134305
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,6144,8192,0.026495999760097925
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,6144,12288,0.07877333296669854
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,6144,10240,0.049357334772745766
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,6144,10240,0.06993422243330213
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,6144,8192,0.04011911153793335
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,6144,8192,0.059346669250064425
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,6144,6144,0.019834667444229126
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,6144,7168,0.03669866588380601
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,6144,7168,0.05546666516198052
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,6144,5120,0.016901334126790363
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,6144,6144,0.03270666797955831
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,6144,4096,0.014370666609870063
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,6144,5120,0.04696711235576206
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,6144,5120,0.029671112696329754
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,6144,3584,0.012799111505349478
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,6144,4096,0.02492622203297085
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,6144,4096,0.04065777858098348
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,6144,3072,0.011785777906576792
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,6144,3584,0.023390221926901076
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,6144,3584,0.03918933206134372
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,6144,2560,0.010409778190983666
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,6144,3072,0.021947556071811255
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,6144,16384,0.09651022487216526
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,6144,2048,0.008951110972298516
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,6144,2560,0.020288000504175823
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,6144,2560,0.03433955709139506
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,6144,1536,0.00793599999613232
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,6144,51200,0.2526328828599718
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,6144,2048,0.03240177697605557
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,6144,7168,0.022713777091768052
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,6144,1024,0.0058257778485616045
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,6144,1536,0.015862221519152325
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,6144,1536,0.028397334946526423
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,6144,1024,0.026383111874262493
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,6144,1024,0.014471999473041959
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,6144,512,0.004850666556093427
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,6144,768,0.013915555344687568
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,6144,768,0.026178666286998328
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,6144,256,0.004182222402758068
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,6144,512,0.01347644461525811
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,6144,512,0.02365511159102122
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,6144,6144,0.0507226652569241
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,6144,128,0.003912888881233004
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,6144,256,0.01275288893116845
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,6144,256,0.0232968893316057
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,6144,64,0.003567999849716822
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,6144,128,0.020961778031455144
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,6144,64,0.012437333663304647
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,6144,3072,0.03697333402103848
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,6144,32,0.012445333103338877
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,5120,65536,0.15972710980309382
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,5120,51200,0.11496888266669379
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,6144,2048,0.01793244481086731
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,5120,65536,0.25250665346781415
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,6144,768,0.0052284445199701525
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,5120,16384,0.03977333174811469
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,5120,51200,0.2017057736714681
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,5120,12288,0.03262133399645487
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,5120,16384,0.09531822469499375
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,5120,12288,0.055917335881127246
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,5120,10240,0.02737688852681054
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,5120,65536,0.3197253280215793
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,5120,12288,0.07804266611735027
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,5120,51200,0.2505653434329563
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,5120,8192,0.022600889205932617
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,6144,128,0.012461333639091916
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,5120,10240,0.047409776184293956
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,5120,7168,0.019839111301634047
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,5120,10240,0.06874755356046888
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,5120,6144,0.01738577749994066
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,5120,8192,0.038775109582477145
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,5120,8192,0.05900355842378405
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,5120,7168,0.035628444618648954
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,5120,5120,0.015142222245534262
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,5120,7168,0.05484444565243191
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,5120,4096,0.013392888837390475
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,5120,6144,0.032305777072906494
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,5120,5120,0.04660088817278544
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,5120,5120,0.028789334826999243
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,5120,3584,0.012139555480745105
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,5120,4096,0.040989332728915744
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,5120,3072,0.011014222270912595
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,5120,3584,0.02279022170437707
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,5120,3584,0.03936977850066291
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,5120,2560,0.009717333647939894
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,5120,3072,0.021379555265108745
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,5120,16384,0.0724782215224372
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,5120,3072,0.03639288743336996
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,5120,2048,0.008736888567606607
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,5120,2560,0.03427377674314711
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,5120,2560,0.0195777780479855
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,5120,1536,0.0069439998931354946
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,5120,2048,0.01716977854569753
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,5120,2048,0.030213332838482324
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,5120,1024,0.005850666513045629
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,5120,1536,0.030435555511050757
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,5120,1536,0.015863999724388123
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,6144,32,0.003559999995761447
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,5120,768,0.004565333326657613
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,5120,512,0.0042444442709287005
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,5120,1024,0.014260444376203748
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,5120,1024,0.026050666968027752
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,5120,256,0.003850666599141227
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,5120,768,0.025713778204388086
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,5120,768,0.013811555173661975
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,5120,128,0.003489777859714296
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,5120,512,0.023698666029506262
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,5120,512,0.013471110827393003
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,5120,64,0.0035182221068276297
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,5120,256,0.024333332975705464
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,5120,256,0.01272266689274046
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,5120,32,0.003579555700222651
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,5120,128,0.02090488870938619
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,5120,128,0.012715555727481842
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,5120,64,0.012741333080662621
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,5120,4096,0.02455644475089179
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,5120,32,0.012070222033394707
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,4096,65536,0.1105911135673523
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,4096,16384,0.03256533212131924
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,4096,51200,0.08851733472612168
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,4096,65536,0.2213102181752523
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,4096,12288,0.025800888737042744
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,4096,16384,0.06079466475380791
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,4096,16384,0.09258488814036052
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,4096,10240,0.0224924451775021
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,4096,12288,0.04674311147795784
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,4096,12288,0.07563022110197279
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,4096,8192,0.018732445107565988
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,4096,10240,0.040580444865756564
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,4096,65536,0.3091955449846056
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,4096,10240,0.06692533360587226
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,4096,7168,0.015764445066452026
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,4096,8192,0.03371555606524149
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,4096,8192,0.0572942230436537
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,4096,6144,0.014780445231331719
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,4096,7168,0.03105866577890184
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,4096,7168,0.0532168878449334
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,4096,5120,0.012921777864297232
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,5120,6144,0.05032533407211304
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,4096,6144,0.04929955469237434
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,4096,4096,0.01148888882663515
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,4096,5120,0.04544533292452494
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,4096,3584,0.010663111176755695
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,4096,4096,0.02200800014866723
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,4096,4096,0.03981511129273309
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,4096,3072,0.009299555586444007
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,4096,3584,0.020619556307792664
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,4096,3584,0.038431111309263445
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,4096,2560,0.008635555704434713
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,4096,3072,0.019550222489568923
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,4096,51200,0.1687164439095391
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,4096,2048,0.00776088900036282
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,4096,2560,0.017553778158293832
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,4096,2560,0.03356711069742838
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,4096,1536,0.006224888894293044
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,4096,2048,0.015815110670195687
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,4096,2048,0.029883556895785864
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,4096,1024,0.005201777650250329
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,4096,51200,0.24302487903171113
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,4096,1536,0.014541332920392355
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,4096,768,0.004538666870858935
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,4096,1536,0.028157333532969158
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,4096,1024,0.013832000394662222
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,4096,1024,0.02605777813328637
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,4096,512,0.004171555654870139
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,4096,768,0.025705777936511572
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,4096,768,0.013359111216333179
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,4096,256,0.003913777983850903
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,4096,512,0.02399377855989668
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,4096,512,0.012853333519564735
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,4096,6144,0.028840889533360798
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,4096,128,0.0038453332251972626
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,4096,256,0.023129777775870428
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,4096,256,0.01240711079703437
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,4096,64,0.00350222239891688
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,4096,5120,0.02623733381430308
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,4096,32,0.0035146665241983202
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,4096,128,0.020609777834680345
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,4096,128,0.012111110819710625
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,4096,64,0.01203644441233741
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,3584,65536,0.10222933027479385
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,3584,51200,0.08786044518152873
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,3584,16384,0.034619556532965765
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,3584,65536,0.2154017819298638
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,4096,3072,0.0338986681567298
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,3584,12288,0.029063112205929224
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,3584,51200,0.1658533281750149
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,3584,16384,0.0601102246178521
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,3584,10240,0.024655110306209985
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,3584,16384,0.09188177850511338
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,3584,12288,0.047206223011016846
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,3584,12288,0.07527022229300605
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,3584,10240,0.03991644581158956
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,3584,10240,0.06646044386757745
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,3584,51200,0.2407991091410319
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,3584,7168,0.018062222335073683
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,3584,65536,0.3086577786339654
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,3584,8192,0.03386044502258301
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,3584,6144,0.016355555918481614
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,3584,8192,0.05682133303748237
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,3584,5120,0.014128888646761576
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,3584,7168,0.05299644337760078
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,3584,7168,0.03102488981352912
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,3584,6144,0.02831733226776123
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,3584,6144,0.04915111263593038
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,3584,5120,0.04522666666242811
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,3584,5120,0.025740444660186768
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,3584,3584,0.009686222506894005
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,3584,4096,0.03998311029540168
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,3584,4096,0.021701332595613267
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,3584,3072,0.009154666629102495
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,3584,3584,0.020215999748971727
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,3584,3584,0.0377439988984002
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,3584,2560,0.008294222255547842
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,4096,32,0.012051555845472546
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,3584,3072,0.018568888306617737
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,3584,3072,0.03458933366669549
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,3584,2048,0.007377777662542131
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,3584,1536,0.006278222219811545
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,3584,2560,0.01751377847459581
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,3584,2560,0.03117155697610643
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,3584,1024,0.0052684446175893145
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,3584,2048,0.01574133336544037
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,3584,1536,0.028119110398822363
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,3584,1536,0.014512000812424554
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,3584,768,0.0047493332790003884
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,3584,1024,0.013742222554153867
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,3584,1024,0.026093333959579468
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,3584,512,0.004348444441954295
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,3584,768,0.025416889124446448
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,3584,768,0.013422222601042854
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,3584,8192,0.020821332931518555
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,3584,256,0.003912000192536248
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,3584,512,0.01308444473478529
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,3584,128,0.0035439998739295532
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,3584,256,0.023365333676338196
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,3584,256,0.01239111108912362
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,3584,128,0.020273778173658583
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,3584,64,0.003495111233658261
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,3584,32,0.0034799998005231223
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,3584,4096,0.010654222634103564
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,3584,64,0.012049777640236748
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,3072,65536,0.09386666615804036
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,3584,32,0.011766222616036734
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,3072,51200,0.07535022497177124
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,3072,65536,0.21007111337449816
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,3072,51200,0.16274933020273843
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,3072,16384,0.0317884451813168
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,3584,2048,0.029883556895785864
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,3072,16384,0.058240003055996366
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,3072,12288,0.02167822255028619
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,3072,16384,0.09184355868233575
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,3072,65536,0.3074737654791938
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,3072,51200,0.23959822124905059
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,3072,10240,0.018180444836616516
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,3072,12288,0.04492177897029453
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,3072,8192,0.015267555912335714
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,3072,12288,0.0749537746111552
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,3072,7168,0.014120888378885059
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,3072,10240,0.03908088803291321
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,3584,512,0.024381332927280005
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,3072,10240,0.06646933158238728
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,3072,6144,0.012968888713253869
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,3072,8192,0.03308444552951389
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,3072,8192,0.05636622508366903
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,3072,5120,0.011003555523024665
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,3072,7168,0.052863111098607383
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,3072,7168,0.03030844529469808
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,3072,6144,0.02794044547610813
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,3072,6144,0.048784001006020435
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,3072,3584,0.009024000002278222
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,3072,5120,0.04516266783078512
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,3072,5120,0.025458667013380263
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,3072,3072,0.008625778059164682
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,3072,4096,0.021352888809310064
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,3072,4096,0.03968711031807794
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,3072,2560,0.007369777394665613
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,3072,3584,0.03583200110329522
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,3072,3584,0.019553777244355943
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,3072,2048,0.0069022224181228215
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,3072,3072,0.017900443739361234
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,3072,2560,0.031558222240871854
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,3072,2560,0.01717688971095615
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,3072,1536,0.005554666535721884
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,3072,2048,0.029281778468026057
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,3072,2048,0.015400000744395785
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,3072,1024,0.004846222284767362
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,3072,1536,0.014780445231331719
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,3072,1024,0.013528000149461957
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,3072,768,0.004233777936961916
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,3072,768,0.01312888910373052
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,3072,768,0.024353777368863423
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,3072,512,0.0038817777401871155
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,3584,128,0.012179555164443122
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,3072,4096,0.009986666341622671
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,3072,256,0.003526222374704149
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,3072,512,0.012726222475369772
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,3072,512,0.02372177773051792
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,3072,128,0.0032426667296224167
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,3072,256,0.023018666439586218
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,3072,256,0.01238933371173011
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,3072,64,0.003152888889114062
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,3072,3072,0.03528177738189697
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,3072,128,0.0121760004096561
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,3072,32,0.0035217776894569397
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,3072,128,0.019575110740131803
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,3072,64,0.012071111136012606
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,2560,65536,0.07824089129765828
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,3072,32,0.012284444438086616
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,3072,1536,0.027405333187845018
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,2560,51200,0.06159910890791151
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,3072,1024,0.024529778295093115
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,2560,65536,0.20895822842915854
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,2560,51200,0.16193866729736328
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,2560,16384,0.05495822098520067
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,2560,16384,0.09080533186594646
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,2560,51200,0.23921600977579752
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,2560,65536,0.30616890059577095
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,2560,12288,0.044365333186255566
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,2560,12288,0.07380355728997125
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,2560,8192,0.015071110592948066
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,2560,10240,0.0388373335202535
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,2560,10240,0.06567111280229357
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,2560,8192,0.03251111176278856
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,2560,7168,0.013558222187889947
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,2560,6144,0.012492444780137805
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,2560,8192,0.056377775139278836
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,2560,7168,0.05258311165703667
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,2560,7168,0.030233777231640283
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,2560,5120,0.01127377814716763
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,2560,6144,0.0277528895272149
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,2560,6144,0.04840088884035746
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,2560,4096,0.009992000129487779
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,2560,5120,0.04473511046833462
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,2560,5120,0.024734222226672705
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,2560,3584,0.008986666798591614
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,2560,4096,0.03737866547372606
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,2560,3072,0.008291555775536431
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,2560,3584,0.01888533267709944
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,2560,3584,0.03734488950835334
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,2560,2560,0.007260444263617198
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,2560,3072,0.01756800048881107
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,2560,12288,0.02279288901223077
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,2560,3072,0.03293244375122918
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,2560,2048,0.006343110981914733
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,2560,2560,0.016512889001104567
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,2560,2560,0.031106667386160955
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,2560,1536,0.005607999861240387
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,2560,2048,0.029469334416919287
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,2560,2048,0.015356444650226168
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,2560,1024,0.004873777843183941
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,2560,1536,0.02741066614786784
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,2560,1536,0.014281777871979607
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,2560,768,0.0041599998043643106
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,2560,1024,0.026047110557556152
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,2560,512,0.0038444445365005066
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,2560,768,0.024275556206703186
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,2560,768,0.013066666821638743
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,2560,256,0.003548444559176763
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,2560,512,0.0236791107389662
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,2560,512,0.01277955538696713
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,2560,128,0.003162666741344664
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,2560,256,0.012103999654452005
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,2560,256,0.024319110645188227
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,2560,64,0.0031617778456873367
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,2560,128,0.020119110743204754
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,2560,32,0.003152888889114062
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,2560,4096,0.02058577703105079
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,2560,64,0.01203733351495531
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,2560,16384,0.028668443361918133
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,2560,32,0.011679111255539788
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,2048,51200,0.050247109598583646
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,2048,65536,0.16940532790289986
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,2048,51200,0.13015911314222547
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,2048,16384,0.0222044438123703
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,2560,10240,0.02021511064635383
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,2048,16384,0.04591111010975308
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,2048,65536,0.30284354421827525
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,2048,51200,0.23866666687859428
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,2048,16384,0.09057777457767063
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,2048,10240,0.0165964447789722
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,2560,1024,0.013410666750537025
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,2048,8192,0.014468444718254937
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,2048,12288,0.073725336127811
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,2048,10240,0.03248000144958496
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,2048,10240,0.06541599829991658
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,2048,7168,0.01312444441848331
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,2048,8192,0.02770311137040456
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,2048,8192,0.056017776330312095
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,2048,6144,0.011687111523416309
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,2048,7168,0.05247999893294441
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,2048,7168,0.02569777766863505
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,2048,5120,0.010674667027261523
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,2048,6144,0.02401955591307746
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,2048,6144,0.04853866828812493
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,2048,65536,0.06049955553478665
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,2048,4096,0.009091555244392818
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,2048,5120,0.021384000778198242
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,2048,3584,0.008715555899673039
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,2048,5120,0.04262488749292162
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,2048,4096,0.017857778403494094
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,2048,3072,0.007819555699825287
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,2048,3584,0.017222222354676988
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,2048,3584,0.035629332065582275
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,2048,2560,0.006837333242098491
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,2048,3072,0.016152888536453247
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,2048,3072,0.03298844562636481
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,2048,2048,0.005565333283609814
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,2048,2560,0.015135111080275642
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,2048,12288,0.020641777250501845
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,2048,2560,0.03087200058831109
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,2048,1536,0.004912888838185204
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,2048,2048,0.014171555638313293
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,2048,2048,0.029170665476057265
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,2048,1024,0.0041884444653987885
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,2048,1536,0.027296000056796606
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,2048,1536,0.013425778183672162
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,2048,768,0.004218666503826777
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,2048,1024,0.0247022228108512
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,2048,512,0.0038355555799272326
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,2048,768,0.024749333659807842
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,2048,768,0.012455999851226807
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,2048,256,0.003524444583389494
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,2560,128,0.012086222569147745
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,2048,512,0.012383999923865
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,2048,512,0.023032888770103455
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,2048,128,0.0032097777972618737
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,2048,256,0.012079999678664737
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,2048,256,0.02347466680738661
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,2048,64,0.0031759999692440033
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,2048,128,0.02035555574629042
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,2048,32,0.0032346666687064697
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,2048,4096,0.039220445685916476
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,1536,65536,0.04900888933075798
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,2048,64,0.011988444460762871
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,2048,32,0.011471110913488599
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,1536,51200,0.04167733258671231
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,1536,65536,0.16596355703141955
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,1536,51200,0.12834133042229548
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,1536,16384,0.01905155513021681
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,1536,65536,0.30252355999416775
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,1536,51200,0.23713599310980904
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,2048,12288,0.03615199857287937
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,1536,16384,0.045223110251956515
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,1536,12288,0.016200888488027785
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,1536,16384,0.08978844351238674
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,1536,10240,0.014658666319317289
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,2048,1024,0.012849777936935425
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,1536,8192,0.014081777797804939
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,1536,12288,0.07312266694174872
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,1536,12288,0.03561333484119839
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,1536,10240,0.06535555256737603
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,1536,8192,0.05582133266660902
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,1536,8192,0.02737066646416982
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,1536,7168,0.025069332785076563
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,1536,7168,0.05173066589567396
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,1536,5120,0.01018044435315662
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,1536,6144,0.022451554735501606
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,1536,6144,0.04803911182615492
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,2048,128,0.011705777711338468
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,1536,4096,0.00850577818022834
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,1536,5120,0.02115999990039402
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,1536,5120,0.04236800140804715
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,1536,3584,0.007625777688291337
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,1536,4096,0.03713599840799967
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,1536,4096,0.017535999417304993
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,1536,3072,0.0069546666410234236
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,1536,3584,0.035692443450291954
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,1536,3584,0.01682933337158627
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,1536,2560,0.006315555423498154
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,1536,3072,0.032864888509114586
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,1536,3072,0.01586577792962392
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,1536,2048,0.005934222290913264
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,1536,1536,0.005211555709441503
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,1536,2560,0.015116444892353482
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,1536,2560,0.031173331869973078
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,1536,2048,0.029142220815022785
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,1536,2048,0.014163555370436775
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,1536,1536,0.02755111124780443
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,1536,1536,0.013401777380042605
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,1536,768,0.0041759999261962045
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,1536,1024,0.025417778227064345
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,1536,1024,0.012727110750145383
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,1536,512,0.0038533334930737815
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,1536,768,0.02504088812404209
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,1536,768,0.012392000191741519
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,1536,10240,0.0322382218307919
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,1536,256,0.0035235554807715942
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,1536,512,0.012059555285506778
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,1536,512,0.023432888918452795
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,1536,128,0.003173333282272021
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,1536,6144,0.011390222443474663
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,1536,256,0.011772444678677453
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,1536,64,0.0031475555151700974
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,1536,32,0.0031848889258172777
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,1536,128,0.011729777687125735
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,1536,128,0.020248000820477802
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,1024,65536,0.037447998921076454
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,1536,64,0.011432888607184092
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,1536,32,0.011535999675591787
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,1024,51200,0.030815998713175457
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,1024,65536,0.16388621595170763
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,1024,16384,0.015562666787041558
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,1024,51200,0.12588000297546387
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,1024,65536,0.3028808964623345
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,1024,51200,0.2358000013563368
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,1024,16384,0.04327822062704298
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,1024,12288,0.013409777647919126
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,1024,16384,0.08957688675986396
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,1024,10240,0.012544000314341651
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,1024,12288,0.035042666726642184
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,1024,12288,0.07285422086715698
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,1024,8192,0.01384800010257297
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,1024,10240,0.03144355614980062
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,1024,10240,0.06481244166692098
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,1024,7168,0.012366222010718452
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,1024,8192,0.02641777859793769
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,1536,7168,0.012649777862760754
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,1024,6144,0.01128000020980835
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,1024,7168,0.024671110841963027
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,1024,7168,0.05039822061856588
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,1024,5120,0.009713778065310584
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,1536,256,0.022295110755496558
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,1024,6144,0.022852443986468848
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,1024,6144,0.046577778127458364
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,1024,4096,0.008288000192907121
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,1024,3584,0.007546666595670912
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,1024,5120,0.02036355601416694
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,1024,4096,0.0369759996732076
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,1024,4096,0.017204445269372728
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,1024,3072,0.006803555621041193
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,1024,3584,0.03532977898915609
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,1024,3584,0.01649777756796943
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,1024,2560,0.006081777728266186
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,1024,3072,0.015788444214397006
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,1024,2048,0.005528888768619961
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,1024,2560,0.030591110388437908
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,1024,2560,0.014841778410805596
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,1024,1536,0.004932444542646408
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,1024,2048,0.029123554627100628
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,1024,2048,0.013787555197874704
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,1024,1024,0.004179555508825514
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,1024,1536,0.01309866706530253
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,1536,1024,0.004570666700601578
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,1024,1536,0.026833777626355488
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,1024,768,0.003863111138343811
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,1024,1024,0.012720888687504662
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,1024,1024,0.024392889605628118
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,1024,512,0.0034808889031410217
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,1024,768,0.024775111012988623
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,1024,768,0.01238666640387641
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,1024,256,0.00319377767542998
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,1024,8192,0.05550133188565572
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,1024,512,0.02366222275627984
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,1024,128,0.0031644445326593188
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,1024,256,0.011754666765530905
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,1024,256,0.0236826671494378
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,1024,64,0.0028124445428450904
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,1024,32,0.0028239999794297745
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,1024,128,0.01955200069480472
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,1024,128,0.011702222128709158
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,768,65536,0.03127911024623447
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,1024,5120,0.04191199938456217
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,1024,64,0.011725333001878528
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,768,51200,0.024280000064108107
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,1024,32,0.011359111302428775
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,768,16384,0.013095999757448832
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,768,65536,0.16308711634741888
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,768,51200,0.12428889009687637
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,1024,3072,0.03231199913554721
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,768,16384,0.04360711243417528
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,768,12288,0.012989333106411828
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,768,10240,0.011504888534545898
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,768,16384,0.08891733487447102
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,768,51200,0.2365430990854899
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,768,8192,0.010646222366227044
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,768,12288,0.03484800126817491
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,768,12288,0.07302221986982557
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,768,10240,0.06351733207702637
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,768,7168,0.01000711073478063
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,768,10240,0.030897776285807293
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,768,6144,0.009339555270142024
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,768,8192,0.05370222197638618
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,768,5120,0.008919110728634728
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,768,7168,0.04930222365591261
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,768,7168,0.02370577719476488
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,768,6144,0.04572888877656725
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,768,6144,0.02197866638501485
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,768,5120,0.020073778099483915
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,1024,512,0.01204355557759603
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,768,4096,0.01754044493039449
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,768,3584,0.007275555696752336
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,768,4096,0.036622222926881574
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,768,3072,0.006587555425034628
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,768,3584,0.03452000021934509
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,768,3072,0.015860444969601102
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,768,3072,0.0325288905037774
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,768,2560,0.014771555860837301
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,768,65536,0.3016480074988471
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,768,2048,0.005327111317051782
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,768,2560,0.03071199854214986
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,768,2048,0.013759111364682516
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,768,2048,0.028601778878106013
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,768,8192,0.025437333517604407
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,768,1536,0.004874666531880696
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,768,1024,0.0041777777175108595
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,768,4096,0.007711110843552484
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,768,1536,0.01314133322901196
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,768,1536,0.02752711044417487
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,768,768,0.003968888686762916
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,768,1024,0.012726222475369772
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,768,1024,0.024367999699380662
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,768,512,0.003510222252872255
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,768,768,0.01255555533700519
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,768,768,0.024693333440356787
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,768,256,0.0032097777972618737
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,768,512,0.02369511127471924
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,768,512,0.012039110892348819
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,768,3584,0.01686044368478987
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,768,128,0.0029528888149393927
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,768,256,0.011722666521867117
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,768,256,0.023383110761642456
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,768,32,0.002871111035346985
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,768,128,0.011693333586057028
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,768,128,0.020287111401557922
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,768,2560,0.005943999936183293
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,512,65536,0.025598223010698955
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,768,64,0.011384000380833944
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,512,51200,0.020557334025700886
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,768,32,0.011703111231327057
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,512,16384,0.011759999725553723
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,512,65536,0.16148622830708823
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,512,51200,0.12366844548119439
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,512,16384,0.04266755448447334
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,512,12288,0.013460444079505073
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,512,51200,0.23471911748250326
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,512,16384,0.08896978033913507
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,512,12288,0.03424355718824599
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,512,10240,0.030510223574108545
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,512,8192,0.010984000232484607
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,768,5120,0.04176355401674906
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,512,10240,0.06441866689258151
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,512,7168,0.009993777506881291
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,512,8192,0.054238223367267184
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,512,8192,0.02550933261712392
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,512,6144,0.009676444033781687
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,512,7168,0.02366755571630266
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,768,64,0.0028328889360030494
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,512,5120,0.008348444269763099
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,512,6144,0.04550310969352722
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,512,6144,0.021963554951879714
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,512,4096,0.007752888732486301
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,512,5120,0.019892444213231403
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,512,5120,0.04175466630193922
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,512,3584,0.007257777783605788
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,512,4096,0.017532444662517972
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,512,4096,0.036630223194758095
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,512,3072,0.006249777972698212
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,512,3584,0.01682933337158627
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,512,65536,0.3007297780778673
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,512,2560,0.00590133335855272
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,512,3072,0.032568001084857516
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,512,3072,0.015795555379655626
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,512,10240,0.012034667034943899
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,512,2048,0.005227555417352253
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,512,1536,0.004601777841647466
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,512,12288,0.07268355290095012
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,512,2560,0.014827556080288358
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,512,1024,0.004171555654870139
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,512,2048,0.013821333646774292
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,512,1536,0.013119999733236102
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,512,768,0.003866666720973121
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,512,1024,0.025407110651334126
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,512,768,0.012401777837011548
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,512,768,0.025012445118692186
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,512,512,0.003516444315512975
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,512,7168,0.048898667097091675
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,512,256,0.003168888803985384
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,512,512,0.012060444388124677
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,512,512,0.02336799932850732
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,512,128,0.0028693332440323303
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,512,256,0.011704000333944956
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,512,256,0.022970666488011677
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,512,64,0.002814222127199173
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,512,128,0.011426666544543372
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,512,128,0.019941333267423842
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,512,32,0.0028684443483750024
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,256,65536,0.018346667289733887
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,512,64,0.011700444751315646
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,512,3584,0.03546222382121616
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,512,32,0.011408000356621213
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,256,51200,0.015450666348139444
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,512,2560,0.031168888012568157
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,256,65536,0.15971644719441733
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,512,2048,0.028765334023369685
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,256,16384,0.010305778019958073
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,256,51200,0.12229066424899632
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,256,65536,0.3019377655453152
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,512,1536,0.027395556370417278
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,256,12288,0.008977777428097194
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,256,10240,0.009372444616423713
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,512,1024,0.01240533341964086
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,256,51200,0.23670487933688691
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,256,16384,0.08843021922641331
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,256,8192,0.008345777789751688
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,256,12288,0.0329440004295773
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,256,7168,0.007988444632954067
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,256,10240,0.029520889123280842
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,256,8192,0.02539288832081689
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,256,8192,0.052941332260767617
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,256,6144,0.007657777931955125
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,256,7168,0.023630221684773762
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,256,7168,0.04890133274926079
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,256,5120,0.007974222302436829
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,256,6144,0.021595555875036452
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,256,6144,0.045201778411865234
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,256,4096,0.007607999775144789
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,256,5120,0.019888000355826486
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,256,5120,0.041542222102483116
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,256,3584,0.007247111035717859
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,256,4096,0.03701600101259019
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,256,4096,0.017214222086800467
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,256,3072,0.00629066675901413
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,256,3584,0.016881777180565726
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,256,2560,0.005920889063013925
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,256,3072,0.01568533314598931
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,256,2560,0.015124445160230001
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,256,2560,0.030870222383075293
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,256,2048,0.005107555538415909
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,256,16384,0.041088889042536415
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,256,2048,0.013771555489963956
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,256,1536,0.004572444491916233
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,256,12288,0.07124266359541151
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,256,1024,0.003839111162556542
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,256,10240,0.06181333462397257
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,256,1536,0.01314933349688848
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,256,1536,0.027055111196306016
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,256,768,0.0035457776652442086
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,256,1024,0.012440000143316058
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,256,1024,0.02439022229777442
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,256,512,0.0031439999325407874
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,256,768,0.02502044373088413
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,256,768,0.01205244412024816
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,256,256,0.0031475555151700974
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,256,512,0.011781333221329583
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,256,128,0.0028888889484935333
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,256,256,0.023358222511079576
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,256,256,0.011408888631396823
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,256,64,0.002521777732504739
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,256,128,0.020591111646758187
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,256,128,0.011424889167149862
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,256,3584,0.03498311175240411
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,256,32,0.002510222295920054
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,256,64,0.011408000356621213
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,128,65536,0.015464888678656684
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,256,3072,0.032856888241238065
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,256,32,0.011349333657158745
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,128,65536,0.15758489237891302
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,128,16384,0.009478222164842818
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,128,51200,0.11973599592844646
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,128,65536,0.300289789835612
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,256,2048,0.029356443219714697
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,128,51200,0.23511823018391928
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,128,12288,0.008615111311276754
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,128,10240,0.00868977771864997
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,128,16384,0.08662222491370307
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,128,16384,0.040720889965693154
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,128,8192,0.007992888490358988
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,128,12288,0.032962666617499456
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,128,12288,0.07015199793709649
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,128,7168,0.007987555530336168
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,128,10240,0.029059555795457628
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,128,10240,0.06152711311976115
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,128,6144,0.007294221884674496
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,128,8192,0.025202666719754536
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,128,8192,0.05295200149218241
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,128,5120,0.008264000217119852
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,128,7168,0.023064000738991633
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,128,7168,0.04871999886300829
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,128,4096,0.007491555478837755
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,128,6144,0.04485599862204658
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,256,512,0.022300443715519373
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,128,3584,0.007246221933099959
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,128,5120,0.04140533341301812
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,128,3072,0.006728000111050076
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,128,4096,0.036306666003333196
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,128,3584,0.03427733315361871
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,128,3584,0.016230222251680162
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,128,2560,0.006285333385070165
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,128,3072,0.01569422251648373
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,128,51200,0.013793778088357715
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,128,2560,0.014481777946154276
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,128,2048,0.006248888870080312
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,128,2560,0.030870222383075293
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,128,1536,0.004572444491916233
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,128,2048,0.028563555743959215
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,128,2048,0.013436444103717804
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,128,1024,0.0038337777886125776
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,128,1536,0.02679377794265747
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,128,1024,0.01238222254647149
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,128,768,0.00349866681628757
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,128,1024,0.024338665935728285
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,128,768,0.024633778466118708
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,128,768,0.012030222349696688
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,128,512,0.003156444471743372
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,128,6144,0.02126933303144243
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,128,512,0.011726222104496427
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,128,256,0.0028764444092909494
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,128,512,0.022687999738587275
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,128,128,0.002817777709828483
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,128,4096,0.01753155555990007
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,128,256,0.02292355563905504
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,128,256,0.011403555671374003
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,128,64,0.002524444419476721
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,128,128,0.011380444798204633
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,128,3072,0.03219377663400438
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,64,65536,0.014431110686726041
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,128,64,0.011008000208271874
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,128,32,0.01107022249036365
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,64,51200,0.012725333372751871
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,64,16384,0.00963199966483646
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,64,65536,0.15939554903242323
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,128,1536,0.01310488912794325
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,64,16384,0.04110399881998698
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,64,51200,0.12115644084082709
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,64,10240,0.007646222081449296
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,64,8192,0.0069653333889113525
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,64,12288,0.03263911273744371
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,64,10240,0.029463112354278564
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,64,7168,0.006911110960774952
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,64,8192,0.025026667449209426
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,64,6144,0.00656444455186526
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,64,5120,0.006224000205596288
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,64,7168,0.023152889476882085
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,64,4096,0.006566222343179915
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,64,6144,0.021264889174037512
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,64,3584,0.006264888991912206
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,64,5120,0.01992266707950168
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,128,5120,0.019906666543748643
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,64,3072,0.006216889040337668
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,64,2560,0.0063493334584765965
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,64,4096,0.017166222135225933
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,64,2048,0.0058906666106647914
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,64,3584,0.016114667057991028
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,64,3072,0.015792000624868605
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,64,1536,0.0042239998777707415
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,256,128,128,0.019912888606389362
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,64,1024,0.003823111040724648
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,64,2560,0.014640889234013028
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,64,768,0.0035093331502543557
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,64,2048,0.013759111364682516
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,64,512,0.003195555466744635
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,64,256,0.0028897778441508612
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,64,1536,0.013421333498424955
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,64,1024,0.012358222570684222
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,64,768,0.01239377756913503
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,64,64,0.0027946666296985415
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,64,512,0.011763555308183035
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,64,32,0.002578666640652551
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,64,128,0.011055111057228513
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,32,65536,0.013749333719412485
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,64,64,0.011390222443474663
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,32,51200,0.01239466667175293
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,32,65536,0.15864977571699354
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,32,51200,0.11869688828786214
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,32,16384,0.008963555925422246
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,32,12288,0.008268444074524773
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,32,16384,0.04000622365209792
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,32,12288,0.03250666790538364
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,32,10240,0.0076453329788313965
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,32,8192,0.007280000381999546
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,32,10240,0.029150221082899306
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,128,32,0.002487999904486868
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,32,8192,0.02507466740078396
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,32,7168,0.006963555183675554
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,32,6144,0.006732444382376141
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,32,5120,0.006285333385070165
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,32,7168,0.02327555583582984
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,64,128,0.0028320000403457214
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,32,4096,0.0059057776298787855
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,32,3584,0.006291555447710886
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,32,5120,0.019885333047972787
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,64,256,0.011757333245542316
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,32,3072,0.006211555666393704
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,32,4096,0.01722133325205909
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,32,2560,0.006617777877383762
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,64,12288,0.008288000192907121
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,32,2048,0.006254222244024277
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,32,3584,0.016161777906947665
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,64,32,0.011015999648306104
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,32,3072,0.015832000308566622
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,32,1536,0.004519999855094486
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,32,1024,0.0038702223036024305
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,32,2560,0.014780445231331719
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,32,768,0.003527111063400904
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,32,2048,0.013537777794731988
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,32,512,0.0032186667538351486
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,32,1536,0.013058666553762225
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,32,256,0.0028577778074476454
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,32,1024,0.012379555238617791
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,32,128,0.002513777878549364
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,32,768,0.012413333687517377
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,32,64,0.002551111082235972
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,32,512,0.011711111499203576
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,256,32,32,0.0028328889360030494
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,32,256,0.011403555671374003
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,32,128,0.011373333632946014
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,32,64,0.01147911118136512
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,32,32,0.01069777790043089
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,65536,12288,0.310208002726237
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,65536,16384,0.49603822496202254
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,65536,12288,0.2772791120741102
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,65536,16384,0.36673333909776473
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,65536,8192,0.20140711466471353
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,65536,10240,0.2466968960232205
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,65536,8192,0.18857244650522867
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,65536,10240,0.23353245523240831
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,65536,7168,0.1775697734620836
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,65536,6144,0.15204977989196777
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,65536,51200,1.1392996046278212
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,65536,7168,0.16594933138953313
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,65536,5120,0.12960267066955566
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,65536,6144,0.1467048856947157
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,65536,4096,0.10731466611226399
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,65536,51200,1.5245013766818578
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,65536,4096,0.10081599818335639
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,65536,3072,0.08210221926371257
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,65536,3584,0.08973422315385605
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,65536,5120,0.12063466178046332
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,65536,2560,0.06753066513273451
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,65536,2048,0.0562631090482076
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,65536,1536,0.04349866509437561
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,256,32,6144,0.021014221840434607
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,65536,2048,0.05990488661660088
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,65536,1024,0.033026665449142456
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,65536,1536,0.04855733447604709
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,65536,2560,0.06895733541912503
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,65536,768,0.02583733366595374
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,65536,512,0.018983999888102215
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,65536,256,0.012807110945383707
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,65536,1024,0.03966755668322245
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,65536,3072,0.0780328909556071
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,65536,128,0.011653333074516721
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,65536,64,0.009308444129096137
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,65536,32,0.009257777697510189
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,65536,768,0.03394488824738397
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,65536,256,0.025785777303907607
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,65536,128,0.024703111913469102
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,65536,64,0.024706666668256123
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,65536,512,0.02910311023394267
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,65536,32,0.02931200133429633
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,51200,16384,0.32880711555480957
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,65536,3584,0.09338755740059747
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,51200,16384,0.29470756318834096
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,51200,12288,0.24967288970947266
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,51200,10240,0.17540178034040663
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,51200,12288,0.2233048809899224
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,51200,8192,0.14549956056806776
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,51200,51200,0.9028106265597873
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,51200,51200,1.0214719772338867
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,51200,10240,0.18581510914696586
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,51200,7168,0.12552889188130698
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,51200,8192,0.15430488851335314
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,51200,6144,0.11714666419559056
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,51200,65536,1.317986700269911
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,51200,5120,0.09251022338867188
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,51200,7168,0.13387021753523085
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,51200,6144,0.11746933725145127
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,51200,3584,0.06707111332151625
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,51200,5120,0.09866222408082749
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,51200,3072,0.058393776416778564
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,51200,4096,0.07954844501283434
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,51200,2560,0.04900711112552219
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,51200,2048,0.04212977819972568
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,51200,3584,0.07348977857165866
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,51200,1536,0.03426577647527059
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,51200,1024,0.024596444434589807
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,51200,2560,0.057447108957502574
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,51200,3072,0.06471200121773614
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,51200,1536,0.041794667641321816
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,51200,768,0.0188071115149392
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,51200,4096,0.08360622326533
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,51200,512,0.014208000567224292
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,51200,1024,0.0342497792508867
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,51200,2048,0.04983466532495287
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,51200,256,0.012086222569147745
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,51200,128,0.010324444207880232
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,51200,64,0.0090515555606948
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,51200,768,0.028488887680901423
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,51200,32,0.009700444837411245
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,51200,512,0.024907555845048692
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,51200,256,0.023039110832744177
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,51200,128,0.02162133322821723
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,51200,64,0.021663111117151048
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,51200,65536,1.1791138119167752
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,51200,32,0.02560088866286808
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,16384,16384,0.11187556054857041
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,16384,51200,0.3086177772945828
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,16384,12288,0.08727555804782444
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,16384,65536,0.39241600036621094
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,16384,51200,0.35422754287719727
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,16384,16384,0.11832266383700901
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,16384,10240,0.07058488660388522
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,16384,65536,0.4435448911454942
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,16384,10240,0.07648177941640218
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,16384,7168,0.051706665092044406
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,16384,12288,0.09089422225952148
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,16384,6144,0.04511022236612108
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,16384,8192,0.06486933098898993
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,16384,5120,0.03833511140611436
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,16384,4096,0.032744000355402626
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,16384,3584,0.028905779123306274
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,16384,6144,0.05192000004980299
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,16384,5120,0.04318933354483711
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,16384,3072,0.025812443759706285
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,16384,4096,0.0373582210805681
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,16384,2560,0.021635555558734473
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,16384,2048,0.018114666144053142
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,16384,3072,0.03160266743765937
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,16384,3584,0.03464711043569777
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,16384,2560,0.027463111612531874
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,16384,1024,0.011053333679835001
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,16384,2048,0.024320888850424025
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,16384,768,0.009679111341635386
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,16384,512,0.007616000043021307
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,16384,1536,0.021936888496081035
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,16384,1024,0.01937955617904663
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,16384,256,0.005554666535721884
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,16384,768,0.017514665921529133
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,16384,128,0.0048062221871482
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,16384,512,0.01650311052799225
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,16384,64,0.00462311092350218
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,16384,32,0.005222222043408289
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,16384,256,0.015134221977657743
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,16384,128,0.014504000544548035
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,16384,64,0.01481244464715322
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,16384,32,0.014479999740918478
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,16384,8192,0.05963022179073758
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,12288,65536,0.29462843471103245
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,12288,51200,0.2306906647152371
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,16384,7168,0.05786222219467163
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,12288,16384,0.07690578036838107
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,12288,65536,0.3804319964514838
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,12288,12288,0.061145775847964816
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,12288,10240,0.050880889097849526
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,12288,51200,0.29579467243618435
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,12288,8192,0.04295733239915636
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,12288,16384,0.10282578070958455
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,12288,7168,0.037760890192455716
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,12288,6144,0.03272533416748047
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,12288,10240,0.06738489203982882
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,16384,1536,0.014399111270904541
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,12288,8192,0.05734399954477946
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,12288,5120,0.028757333755493164
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,12288,4096,0.024432889289326135
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,12288,7168,0.05246399839719137
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,12288,12288,0.07998310857348971
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,12288,6144,0.046952890025244824
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,12288,3072,0.01905333333545261
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,12288,5120,0.03851999839146932
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,12288,2560,0.016157334049542744
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,12288,4096,0.0337137778600057
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,12288,2048,0.013800000150998434
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,12288,3584,0.031128889984554712
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,12288,1536,0.011007111105653973
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,12288,3072,0.027327110370000202
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,12288,1024,0.009647111097971598
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,12288,768,0.008328888979223039
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,12288,2560,0.025203555822372437
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,12288,2048,0.022346667117542688
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,12288,1536,0.020058666666348774
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,12288,256,0.0052151112920708126
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,12288,1024,0.01754666699303521
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,12288,768,0.016579555140601266
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,12288,128,0.0042239998777707415
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,12288,64,0.004039999925427967
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,12288,512,0.015480889214409722
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,12288,256,0.014152000347773233
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,12288,128,0.013497778111033969
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,12288,64,0.01387466655837165
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,12288,32,0.014141332772043018
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,10240,65536,0.23321244451734754
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,10240,51200,0.18454578187730578
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,10240,16384,0.06288533078299628
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,10240,65536,0.3361813227335612
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,10240,12288,0.049426668220096164
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,10240,51200,0.26194310188293457
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,10240,10240,0.041217777464124895
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,10240,16384,0.09213955534829034
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,10240,12288,0.07177422444025676
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,12288,3584,0.021589333812395733
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,10240,10240,0.06085689200295342
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,10240,7168,0.030579557021458943
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,10240,6144,0.027473777532577515
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,10240,8192,0.05158933334880405
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,10240,5120,0.023503111468421087
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,12288,512,0.006562666760550604
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,10240,7168,0.04705511199103462
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,10240,6144,0.04217866725391812
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,10240,3584,0.01713244451416863
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,10240,5120,0.03455377618471781
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,12288,32,0.003863999827040566
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,10240,3072,0.015464888678656684
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,10240,2560,0.013438222308953604
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,10240,3072,0.02565244502491421
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,10240,2048,0.011799111134476133
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,10240,2560,0.023038221730126276
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,10240,1536,0.00996977753109402
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,10240,2048,0.021198223034540813
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,10240,1024,0.00832177781396442
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,10240,1536,0.01891377733813392
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,10240,768,0.006837333242098491
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,10240,1024,0.0162764439980189
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,10240,512,0.005559111220969095
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,10240,8192,0.035960889524883695
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,10240,768,0.015791111522250705
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,10240,256,0.004576888763242298
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,10240,128,0.0041626666982968645
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,10240,64,0.0038942222793896994
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,10240,512,0.014766222900814481
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,10240,256,0.013798221945762634
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,10240,32,0.0041724443435668945
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,10240,128,0.0131217779384719
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,10240,64,0.01314755529165268
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,10240,4096,0.01999288962946998
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,10240,32,0.014903111590279473
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,10240,4096,0.030236442883809406
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,8192,65536,0.2418382167816162
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,8192,16384,0.06399466594060262
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,8192,51200,0.18853510750664604
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,8192,12288,0.050198223855760365
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,8192,65536,0.28834578726026744
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,8192,10240,0.042061332199308604
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,8192,51200,0.2264497809939914
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,8192,16384,0.08095466428332858
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,8192,8192,0.03568177753024631
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,8192,7168,0.03122133347723219
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,8192,12288,0.06323822339375813
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,8192,6144,0.027278222971492346
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,8192,10240,0.05368355578846402
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,8192,5120,0.023616888456874426
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,8192,8192,0.04611644479963514
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,8192,4096,0.01982133256064521
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,8192,6144,0.03656355539957682
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,8192,7168,0.041391998529434204
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,8192,3584,0.017532444662517972
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,8192,3072,0.015492444237073263
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,8192,5120,0.030718220604790583
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,8192,2048,0.011694221860832639
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,8192,3584,0.025409777959187824
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,8192,3072,0.023524444964196947
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,8192,1536,0.009684444301658207
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,8192,2560,0.021448888712459143
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,8192,1024,0.008245333201355403
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,8192,2048,0.019666666785875957
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,8192,768,0.005917333480384614
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,8192,512,0.005020444591840108
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,8192,1536,0.017473777135213215
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,8192,1024,0.01535288823975457
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,8192,256,0.0042239998777707415
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,8192,128,0.003931555483076307
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,8192,768,0.014820444915029736
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,8192,64,0.00350222239891688
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,8192,512,0.014456000592973499
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,8192,256,0.013134222063753339
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,8192,32,0.0038728887836138406
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,8192,128,0.012783110969596438
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,8192,64,0.012770666844315
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,8192,32,0.012780444489585029
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,10240,3584,0.02753777801990509
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,7168,65536,0.1792551146613227
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,7168,51200,0.14863644705878362
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,7168,16384,0.0488319993019104
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,7168,12288,0.040447112586763166
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,7168,65536,0.2854613463083903
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,7168,10240,0.03295022249221802
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,7168,51200,0.22244355413648817
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,7168,16384,0.07941955327987671
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,7168,8192,0.028142223755518597
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,7168,12288,0.06226311127344767
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,7168,7168,0.025047111842367385
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,7168,10240,0.05284622311592102
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,8192,2560,0.013386666774749756
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,7168,8192,0.04468977782461378
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,8192,4096,0.026899556318918865
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,7168,7168,0.03941599859131707
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,7168,4096,0.016339555382728577
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,7168,6144,0.035529779063330755
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,7168,3584,0.01498933302031623
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,7168,3072,0.0129466669427024
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,7168,5120,0.02982577681541443
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,7168,2560,0.011544889046086205
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,7168,3584,0.02475022276242574
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,7168,2048,0.010279999838935005
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,7168,3072,0.023023110296991136
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,7168,2560,0.02112355497148302
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,7168,2048,0.018830221560266282
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,7168,1024,0.006913777854707506
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,7168,1536,0.01684888866212633
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,7168,768,0.005939555664857228
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,7168,1024,0.015070221490330167
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,7168,512,0.005224888937340842
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,7168,768,0.014808000789748298
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,7168,256,0.0041857775714662345
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,7168,512,0.01404355631934272
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,7168,256,0.01312888910373052
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,7168,128,0.0038337777886125776
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,7168,64,0.003506666670242945
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,7168,6144,0.021301334102948506
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,7168,128,0.012724444270133972
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,7168,5120,0.018536888890796237
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,7168,32,0.003581333491537306
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,7168,64,0.012785777449607849
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,7168,32,0.012440000143316058
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,7168,4096,0.026778666509522334
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,6144,16384,0.04594399862819248
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,6144,12288,0.03628711236847772
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,7168,1536,0.008960000342792934
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,6144,65536,0.24649866422017416
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,6144,16384,0.07003644439909193
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,6144,10240,0.031586666901906334
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,6144,51200,0.19240266746944854
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,6144,8192,0.02590222160021464
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,6144,7168,0.022636445032225713
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,6144,12288,0.05474755499098036
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,6144,6144,0.02034133341577318
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,6144,10240,0.04639644424120585
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,6144,5120,0.017885333961910672
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,6144,8192,0.038741333617104426
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,6144,7168,0.035599999957614474
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,6144,4096,0.01516711049609714
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,6144,6144,0.03179377648565505
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,6144,3072,0.012285333540704517
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,6144,5120,0.02736977736155192
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,6144,4096,0.024341333243581984
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,6144,3584,0.022686221533351477
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,6144,2560,0.011054221954610614
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,6144,2048,0.009739555418491364
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,6144,3072,0.021195555726687115
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,6144,1536,0.008236444658703273
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,6144,1024,0.006918222126033571
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,6144,2560,0.019819556011093985
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,6144,2048,0.017678222722477384
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,6144,768,0.005245333330498801
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,6144,512,0.004550222307443619
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,6144,1536,0.015847111741701763
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,6144,1024,0.014495111174053617
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,6144,256,0.0038542221817705366
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,6144,768,0.014466666513019137
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,6144,128,0.0034924443397257063
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,6144,512,0.01367288910680347
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,6144,64,0.0035075553589397003
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,6144,32,0.003519999898142285
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,6144,256,0.012799999780125089
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,6144,51200,0.14432177278730604
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,6144,65536,0.1667626698811849
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,6144,128,0.012773333324326409
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,6144,64,0.012441777520709567
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,6144,32,0.012439111040698158
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,5120,51200,0.11565511756473118
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,5120,16384,0.04279288980695936
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,5120,12288,0.03235377868016561
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,5120,10240,0.027783112393485174
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,5120,65536,0.2412479983435737
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,5120,16384,0.06863022512859769
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,5120,51200,0.1885653336842855
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,5120,12288,0.05294311046600342
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,5120,8192,0.023767999476856653
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,5120,7168,0.020536889632542927
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,5120,6144,0.019204444355434842
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,5120,10240,0.04473511046833462
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,5120,5120,0.01646844380431705
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,6144,3584,0.013436444103717804
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,5120,8192,0.0380311111609141
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,5120,4096,0.01402844488620758
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,5120,7168,0.03427911135885451
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,5120,3584,0.012934221989578672
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,5120,3072,0.011741333537631564
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,5120,6144,0.031480001078711614
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,5120,2560,0.01036888857682546
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,5120,5120,0.02699288891421424
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,5120,2048,0.009349333743254343
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,5120,3584,0.02234933276971181
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,5120,1536,0.007968000239796108
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,5120,3072,0.020614221692085266
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,5120,1024,0.006245333287451003
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,5120,2560,0.019319110446506076
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,5120,2048,0.01682577696111467
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,5120,1536,0.015460444821251763
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,5120,1024,0.014416888356208801
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,5120,768,0.01422933406300015
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,5120,256,0.0038720000949170855
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,5120,512,0.013478221992651621
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,5120,128,0.003823111040724648
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,5120,256,0.0127697777416971
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,5120,64,0.0031964443624019623
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,5120,65536,0.152563558684455
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,5120,128,0.012421333127551608
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,5120,32,0.003506666670242945
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,5120,64,0.01276088919904497
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,5120,32,0.01203733351495531
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,4096,65536,0.12536711162990993
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,4096,51200,0.09861244757970174
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,4096,65536,0.20187021626366508
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,4096,16384,0.04010755485958523
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,4096,51200,0.15880000591278076
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,4096,12288,0.02988977895842658
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,5120,4096,0.02422933280467987
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,4096,10240,0.02522755497031742
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,4096,16384,0.05834933121999105
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,4096,8192,0.021012443635198805
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,5120,768,0.0052871112194326185
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,4096,12288,0.04516444603602091
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,4096,7168,0.018339556124475267
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,4096,10240,0.03780533207787408
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,4096,6144,0.01670488880740272
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,5120,512,0.004572444491916233
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,4096,5120,0.014458666245142618
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,4096,8192,0.03272799981964959
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,4096,7168,0.030027555094824895
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,4096,3584,0.011542222566074796
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,4096,6144,0.02777422302299076
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,4096,5120,0.024060444699393377
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,4096,4096,0.021270222134060327
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,4096,3584,0.020049777295854356
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,4096,3072,0.018582221534517076
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,4096,2560,0.01681511104106903
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,4096,1536,0.007273777491516537
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,4096,2048,0.015430221954981485
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,4096,1024,0.0059279998143513995
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,4096,768,0.0052266667286554975
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,4096,1536,0.014526221487257214
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,4096,512,0.004528000122971005
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,4096,1024,0.013757333159446716
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,4096,256,0.0038693332009845306
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,4096,768,0.013736888766288757
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,4096,128,0.0038337777886125776
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,4096,512,0.013106666505336761
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,4096,64,0.00350577798154619
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,4096,256,0.012406222522258759
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,4096,32,0.003506666670242945
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,4096,128,0.012090666426552666
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,4096,64,0.01204177737236023
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,4096,32,0.01275199982855055
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,3584,65536,0.10054133335749309
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,4096,4096,0.013304000099500021
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,3584,51200,0.0827911098798116
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,3584,16384,0.03383822242418925
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,4096,3072,0.010675555302037133
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,3584,12288,0.029041777054468792
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,3584,65536,0.20329866144392225
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,4096,2560,0.010572444233629437
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,3584,10240,0.024121777878867254
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,3584,51200,0.1559120019276937
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,3584,16384,0.05626044670740763
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,3584,7168,0.017882666654056974
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,3584,6144,0.015767110718621146
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,3584,12288,0.04371111260520088
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,3584,10240,0.03702844513787164
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,3584,8192,0.03236533204714457
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,3584,5120,0.013840888937314352
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,3584,4096,0.011126221881972419
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,3584,7168,0.02973244587580363
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,3584,3584,0.009983110758993361
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,3584,6144,0.027424888478385076
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,3584,5120,0.02362488872475094
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,3584,3072,0.009377777576446533
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,3584,2560,0.008754666480753157
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,3584,2048,0.007605333295133378
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,3584,3584,0.01957066688272688
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,3584,3072,0.018079110317760043
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,3584,1536,0.006280888699822956
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,3584,2560,0.01649688846535153
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,3584,1024,0.00556355549229516
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,3584,768,0.004908444566859139
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,3584,2048,0.015136889285511441
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,3584,512,0.004350222233268949
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,3584,1536,0.014462222655614218
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,3584,1024,0.013697778185208639
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,3584,768,0.013467555244763693
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,3584,256,0.0035537779331207275
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,3584,512,0.013083555632167392
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,3584,128,0.0035111109415690103
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,3584,64,0.003169777699642711
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,3584,32,0.0032088889016045462
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,3584,128,0.012078222301271228
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,3584,64,0.012317332956526013
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,3072,65536,0.09417333205540974
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,3584,32,0.012058667010731168
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,3584,8192,0.020270221763186984
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,4096,2048,0.008963555925422246
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,3072,51200,0.07918666468726264
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,3072,16384,0.03187822302182516
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,3072,65536,0.19544266329871285
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,3072,12288,0.022671999202834234
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,3072,10240,0.018961777289708454
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,3072,16384,0.05525777737299601
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,3072,51200,0.1529288954204983
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,3072,8192,0.01648266613483429
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,3072,12288,0.042711112234327525
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,3072,7168,0.015122666954994202
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,3584,4096,0.021244444780879553
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,3072,6144,0.013456000222100152
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,3072,10240,0.036335110664367676
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,3072,5120,0.012124444047609964
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,3072,8192,0.03194844391610887
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,3072,4096,0.010678222609890832
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,3072,7168,0.02949777907795376
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,3072,3584,0.00962400022480223
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,3072,3072,0.008966222405433655
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,3072,5120,0.02364088926050398
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,3072,2560,0.00832711077398724
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,3072,4096,0.02034222251839108
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,3072,2048,0.007129777636792924
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,3072,3072,0.01762488815519545
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,3072,1536,0.005559111220969095
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,3072,2560,0.01648000048266517
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,3072,1024,0.004873777843183941
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,3072,2048,0.01516711049609714
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,3584,256,0.012379555238617791
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,3072,768,0.0041662222809261745
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,3072,512,0.0038364442686239877
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,3072,1536,0.014452444182501899
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,3072,256,0.0035253332720862497
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,3072,1024,0.013408000270525614
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,3072,768,0.013448889056841532
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,3072,128,0.0032968889507982465
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,3072,512,0.01310755560795466
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,3072,64,0.0031439999325407874
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,3072,32,0.0031679999083280563
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,3072,128,0.011776888536082374
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,3072,64,0.012168000141779581
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,2560,65536,0.0828533305062188
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,3072,32,0.011708444191349877
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,2560,51200,0.06719822353786893
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,2560,16384,0.02847466535038418
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,2560,12288,0.022277333670192297
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,2560,65536,0.1934293376074897
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,2560,10240,0.022818666365411546
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,2560,16384,0.05375555488798353
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,2560,8192,0.014704000618722705
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,2560,12288,0.04209244582388136
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,3072,6144,0.02743911080890232
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,2560,7168,0.01369244439734353
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,2560,10240,0.03577422102292379
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,2560,6144,0.012351999680201212
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,3072,3584,0.018927999668651156
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,2560,8192,0.031523555517196655
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,2560,5120,0.011016888750924004
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,2560,7168,0.029254221253924902
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,2560,4096,0.01071466671095954
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,2560,3584,0.009604444106419882
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,2560,6144,0.02667466633849674
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,2560,3072,0.008655110994974772
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,2560,4096,0.019719999697473314
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,2560,2560,0.00796622203456031
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,2560,3584,0.01864622202184465
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,2560,2048,0.006968888971540663
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,2560,1536,0.0059075554211934405
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,2560,3072,0.01735822194152408
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,2560,2560,0.016490666402710807
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,2560,1024,0.004951999833186467
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,2560,768,0.005150222116046482
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,2560,2048,0.015136000182893542
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,2560,1536,0.014517333772447375
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,2560,512,0.003887999802827835
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,3072,256,0.01239466667175293
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,2560,1024,0.013456000222100152
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,2560,768,0.013405332962671915
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,2560,128,0.0032035555276605818
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,2560,512,0.013095999757448832
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,2560,64,0.00314666661951277
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,2560,32,0.0031582222630580268
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,2560,256,0.01238222254647149
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,2560,128,0.012051555845472546
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,2560,64,0.012096888489193387
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,2560,32,0.01238933371173011
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,2560,51200,0.1510968870586819
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,2048,51200,0.05385511120160421
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,2048,65536,0.15398666593763563
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,2048,16384,0.024313777685165405
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,2048,51200,0.12029600143432617
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,2048,16384,0.04334577918052673
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,2048,10240,0.018848000301255118
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,2048,8192,0.014016888207859464
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,2048,12288,0.03452622228198581
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,2048,7168,0.012898666991127862
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,2560,5120,0.022796443767017786
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,2048,10240,0.030155556069480047
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,2048,6144,0.011355555719799466
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,2048,7168,0.024636444118287828
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,2048,5120,0.010606221854686737
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,2048,6144,0.023006222314304773
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,2048,4096,0.009005332986513773
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,2560,256,0.003539555602603488
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,2048,5120,0.019276445110638935
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,2048,3584,0.008608000146018134
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,2048,3072,0.0075911109646161394
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,2048,4096,0.01753777762254079
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,2048,2560,0.0068959999415609576
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,2048,3584,0.016869333055284288
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,2048,2048,0.005895111295912001
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,2048,3072,0.015804444750150044
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,2048,65536,0.06989066468344794
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,2048,1536,0.00519822206762102
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,2048,2560,0.015152888165579902
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,2048,1024,0.00453955555955569
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,2048,768,0.003912888881233004
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,2048,2048,0.01427288850148519
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,2048,512,0.003658666792843077
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,2048,1536,0.013452444639470843
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,2048,1024,0.01311466677321328
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,2048,256,0.0035208890007601846
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,2048,768,0.0129120002190272
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,2048,128,0.0032017777363459268
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,2048,12288,0.020248000820477802
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,2048,64,0.002895111011134254
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,2048,512,0.012390221986505719
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,2048,32,0.0032133333798911837
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,2048,256,0.012085333466529846
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,2048,128,0.011544889046086205
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,1536,65536,0.05475733346409268
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,2048,64,0.011363555159833698
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,2048,32,0.011695110963450538
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,1536,51200,0.04519644379615784
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,1536,16384,0.018592889110247295
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,2048,8192,0.02676800058947669
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,1536,10240,0.016929777132140267
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,1536,65536,0.15041155285305446
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,1536,16384,0.04202311237653097
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,1536,51200,0.11826222472720677
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,1536,8192,0.0138586668504609
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,1536,7168,0.01295111080010732
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,1536,10240,0.029841777351167467
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,1536,8192,0.026086222794320848
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,1536,7168,0.024189333120981853
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,1536,4096,0.008989333278603023
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,1536,6144,0.02130577796035343
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,1536,3584,0.008261333737108443
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,1536,5120,0.0188746667570538
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,1536,4096,0.017323555217848886
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,1536,3072,0.007297777467303806
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,1536,2560,0.007256888680987888
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,1536,3584,0.016350222958458793
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,1536,2048,0.006680888848172293
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,1536,3072,0.015834665960735746
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,1536,2560,0.014780445231331719
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,1536,1536,0.005587555468082428
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,1536,1024,0.004547555413511065
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,1536,2048,0.013776889277829064
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,1536,768,0.004218666503826777
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,1536,1536,0.013421333498424955
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,1536,1024,0.012820444173283048
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,1536,512,0.0038542221817705366
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,1536,256,0.003504000190231535
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,1536,768,0.012712889247470431
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,1536,128,0.002858666703104973
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,1536,12288,0.016529776983790927
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,1536,256,0.011764444410800934
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,1536,64,0.0028435554769304064
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,1536,32,0.0028044444819291434
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,1536,12288,0.034506665335761175
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,1536,128,0.011392888923486074
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,1536,64,0.011721777419249216
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,1536,6144,0.011682666838169098
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,1536,32,0.011367110742463006
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,1024,51200,0.03199822372860379
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,1536,5120,0.010050666828950247
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,1024,16384,0.01573066744539473
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,1024,12288,0.014422222971916199
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,1024,65536,0.14761600229475233
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,1024,10240,0.013070222404268054
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,1024,16384,0.040989332728915744
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,1024,51200,0.11576799551645915
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,1024,12288,0.03351199958059523
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,1024,7168,0.011703111231327057
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,1024,10240,0.028927998410330877
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,1024,6144,0.0107004443804423
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,1024,8192,0.02514044443766276
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,1024,7168,0.022673777408070032
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,1024,4096,0.00831288927131229
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,1024,5120,0.01887822151184082
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,1024,3584,0.007426666716734569
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,1024,4096,0.016880000631014507
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,1024,3072,0.0068986668354935115
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,1024,2560,0.005896889087226655
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,1024,3584,0.01651733285850949
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,1536,512,0.012436444560686747
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,1024,3072,0.015455999308162265
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,1024,2048,0.005487999982304043
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,1024,2560,0.014668444792429606
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,1024,2048,0.013744889034165276
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,1024,65536,0.03901688920127021
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,1024,1024,0.0039822223285834
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,1024,1536,0.013426666458447775
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,1024,768,0.0038248888320393036
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,1024,512,0.003560888684458203
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,1024,1024,0.012456888953844706
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,1024,768,0.012493333054913415
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,1024,256,0.0032711111836963226
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,1024,8192,0.011982222398122152
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,1024,512,0.012402666939629449
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,1024,128,0.0028239999794297745
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,1024,64,0.002875555513633622
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,1024,32,0.0028640000770489373
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,1024,256,0.011761777930789523
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,1024,5120,0.009704888694816166
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,1024,64,0.011367999845080905
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,768,65536,0.032002667586008705
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,1024,32,0.011403555671374003
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,1024,6144,0.020933333370420668
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,768,16384,0.013798221945762634
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,768,12288,0.01311377767059538
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,768,51200,0.1139119995964898
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,768,10240,0.01275644451379776
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,768,16384,0.040074666341145836
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,768,8192,0.011398221883508893
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,768,10240,0.027958220905727808
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,768,7168,0.010051555931568146
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,1024,1536,0.004881777697139316
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,768,6144,0.010384889112578498
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,768,7168,0.022642667094866436
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,768,5120,0.009020444419648912
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,768,6144,0.02097333305411869
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,768,4096,0.007958222594526079
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,768,5120,0.01868888901339637
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,768,3584,0.007248889240953658
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,768,4096,0.017118222183651395
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,768,3072,0.006591111007663939
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,1024,128,0.011746666497654386
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,768,3584,0.016490666402710807
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,768,2560,0.005933333188295364
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,768,51200,0.027056000298923914
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,768,3072,0.015476443701320224
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,768,2048,0.00555377784702513
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,768,1536,0.00490044429898262
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,768,1024,0.0041964443193541635
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,768,2560,0.014476444986131458
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,768,2048,0.013653332988421122
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,768,768,0.0038293335172865125
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,768,1536,0.013413333230548434
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,768,512,0.003549333247873518
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,768,256,0.003156444471743372
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,768,1024,0.012730666332774691
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,768,12288,0.032285332679748535
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,768,128,0.0028328889360030494
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,768,64,0.002826666666401757
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,768,512,0.012368888490729861
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,768,768,0.012455999851226807
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,768,32,0.0028088889602157804
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,768,8192,0.024365334047211543
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,768,128,0.01148977792925305
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,768,64,0.011759999725553723
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,512,65536,0.02625688910484314
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,768,32,0.01107377807299296
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,512,51200,0.023808000816239253
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,512,16384,0.011740444435013665
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,512,12288,0.010258666343159145
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,512,10240,0.011750222080283694
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,512,65536,0.14518577522701687
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,512,51200,0.11279555161794026
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,512,12288,0.03190577692455716
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,512,10240,0.027679110566775005
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,512,7168,0.009558222360081142
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,512,6144,0.009033777647548253
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,512,8192,0.024067555864651997
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,512,5120,0.008623110751310984
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,512,7168,0.022611555125978258
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,512,4096,0.007989333735571967
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,512,6144,0.02108888824780782
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,512,3584,0.007241778075695038
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,512,5120,0.01870666609870063
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,512,3072,0.006586666736337874
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,512,4096,0.01683911184469859
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,512,2560,0.005948444621430502
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,512,3584,0.016403555870056152
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,512,2048,0.005532444351249271
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,768,65536,0.14698578251732722
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,512,3072,0.015476443701320224
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,512,1536,0.005223111146026188
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,512,1024,0.0042462220622433555
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,512,2560,0.014486221803559197
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,512,768,0.0038497779104444715
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,512,2048,0.013767999907334646
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,512,512,0.003536888708670934
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,512,1536,0.013471999930010902
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,768,256,0.011780444118711682
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,512,1024,0.012744888663291931
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,512,256,0.0031511110977994073
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,512,768,0.012610666453838348
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,512,128,0.003168888803985384
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,512,64,0.002805333377586471
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,512,512,0.012085333466529846
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,512,32,0.0028693332440323303
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,512,256,0.011758222348160215
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,512,128,0.011705777711338468
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,512,64,0.011394666300879585
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,512,16384,0.03986400034692552
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,512,32,0.011706666813956367
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,512,8192,0.01037333326207267
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,256,16384,0.010335110955768162
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,256,12288,0.01000711073478063
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,256,65536,0.14443466398451063
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,256,16384,0.037963555918799505
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,256,51200,0.1109422246615092
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,256,10240,0.009604444106419882
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,256,8192,0.008937777744399177
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,256,12288,0.031179553932613794
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,256,7168,0.008070222205585903
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,256,6144,0.007912889122962952
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,256,10240,0.027113777067926195
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,256,8192,0.023987554841571387
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,256,5120,0.00867022242810991
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,256,4096,0.007576888634098901
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,256,6144,0.02077866593996684
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,256,5120,0.01854933301607768
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,256,3584,0.007272889216740926
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,256,3072,0.006587555425034628
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,256,4096,0.01647200021478865
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,256,2560,0.005579555614127054
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,256,3584,0.01624000072479248
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,256,2048,0.005256888767083486
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,256,2560,0.014111111561457316
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,256,1536,0.004571555389298333
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,256,2048,0.013415999710559845
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,256,1024,0.0038951109680864546
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,256,65536,0.019928889142142404
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,256,1536,0.012905778156386482
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,256,768,0.0035422220826148987
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,256,51200,0.017135999268955655
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,256,512,0.0031679999083280563
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,256,256,0.0031519999934567344
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,256,1024,0.012446222205956778
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,256,128,0.00282222218811512
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,256,768,0.012429333395428128
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,256,512,0.012070222033394707
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,256,32,0.002817777709828483
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,256,256,0.011710222396585675
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,256,128,0.011405333048767514
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,256,64,0.01129244433508979
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,128,51200,0.015277332729763456
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,256,32,0.011363555159833698
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,128,16384,0.009670221971140968
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,256,7168,0.02233422299226125
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,128,65536,0.14307199584113225
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,128,12288,0.009688888986905416
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,128,51200,0.1095235546429952
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,128,10240,0.009312888814343346
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,128,16384,0.03782400157716539
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,128,8192,0.008426666259765625
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,128,7168,0.00907466643386417
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,128,12288,0.031145777967241075
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,128,10240,0.02702933384312524
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,128,6144,0.00850666645500395
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,128,8192,0.023780445257822674
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,256,3072,0.015126221709781222
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,128,7168,0.02209866709179348
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,128,4096,0.007325333025720384
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,128,3584,0.006937777830494775
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,128,6144,0.02055644492308299
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,128,3072,0.006224000205596288
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,128,5120,0.018216000662909616
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,128,4096,0.01680177781316969
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,128,2560,0.005573333137565189
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,128,3584,0.01588800052801768
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,128,2048,0.004915555732117759
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,128,1536,0.00452622233165635
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,128,3072,0.01482488877243466
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,128,1024,0.0038364442686239877
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,128,2560,0.014475555883513557
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,128,2048,0.013249778085284762
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,256,64,0.0028577778074476454
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,128,1536,0.012973333398501078
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,128,512,0.0032195556494924757
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,128,1024,0.012392000191741519
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,128,256,0.0029519999192820657
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,128,65536,0.017842666970358956
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,128,128,0.002833777831660377
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,128,768,0.012079999678664737
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,128,64,0.002830222249031067
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,128,512,0.012064889073371887
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,128,32,0.002512000087234709
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,128,256,0.011397333608733283
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,64,65536,0.01447111037042406
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,128,128,0.011587555209795633
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,128,64,0.011056889262464313
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,64,51200,0.01237511138121287
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,128,32,0.011024889018800525
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,64,65536,0.14197066095140246
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,64,16384,0.037779556380377874
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,64,51200,0.10997511280907525
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,64,12288,0.009675555759006077
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,64,10240,0.009002666506502364
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,128,5120,0.008671110702885522
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,64,12288,0.030926220946841772
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,64,10240,0.02680977847841051
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,64,7168,0.008967999782827165
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,64,8192,0.023823999696307715
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,64,6144,0.008358221915033128
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,64,5120,0.00794488853878445
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,64,7168,0.02199111051029629
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,64,4096,0.0075795559419526
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,64,6144,0.020607110526826646
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,64,3584,0.006623999940024481
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,128,768,0.0035457776652442086
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,64,4096,0.016176889340082806
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,64,3072,0.006211555666393704
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,64,2560,0.005541333307822545
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,64,3584,0.016159110599093966
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,64,2048,0.004921777794758479
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,64,3072,0.01480977733929952
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,64,1536,0.004512888689835866
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,64,2560,0.014448000325096978
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,64,1024,0.0038151111867692736
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,64,2048,0.013425778183672162
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,64,768,0.003549333247873518
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,64,1536,0.01292888902955585
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,64,512,0.0032142222755485107
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,64,1024,0.012392889294359418
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,64,256,0.0031537777847713898
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,64,768,0.012087999946541257
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,64,128,0.0028213332924577924
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,64,512,0.01204622205760744
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,64,64,0.002806222273243798
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,64,256,0.011753777662913004
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,64,8192,0.008316444853941599
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,64,32,0.0028088889602157804
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,64,128,0.011367110742463006
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,32,65536,0.015817777978049386
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,64,64,0.011071999867757162
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,64,32,0.01146933353609509
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,32,16384,0.009352000223265754
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,32,65536,0.14176889260609946
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,32,51200,0.1083279980553521
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,32,12288,0.009719111025333405
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,64,5120,0.018234666850831773
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,32,16384,0.03818133473396301
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,32,8192,0.007995555798212687
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,32,7168,0.008969777988062965
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,32,12288,0.030935111973020766
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,32,10240,0.027428444888856676
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,32,6144,0.008626666333940294
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,32,5120,0.007887110941939885
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,32,8192,0.024068444967269897
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,32,4096,0.007339555356237624
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,32,7168,0.02218755582968394
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,32,6144,0.020816889074113634
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,32,3584,0.006765333314736684
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,32,3072,0.006275555739800136
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,32,5120,0.018240888913472492
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,32,2560,0.005535999933878581
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,32,4096,0.016890666551060148
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,64,16384,0.009696000152164036
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,32,2048,0.004951999833186467
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,32,1536,0.004573333180612988
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,32,3072,0.015104888214005364
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,32,1024,0.0038515557017591265
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,32,2560,0.014164444473054675
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,32,2048,0.01314133322901196
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,32,1536,0.013455111119482251
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,32,512,0.0031928889867332247
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,32,1024,0.012111999922328524
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,32,256,0.003000000077817175
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,32,768,0.012115555504957834
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,32,128,0.002549333290921317
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,32,51200,0.013515555196338229
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,32,512,0.012255111502276527
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,32,64,0.002507555608948072
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,32,256,0.011448000040319232
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,32,128,0.011075555450386472
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,32,64,0.011749332977665795
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,32,32,0.01074044406414032
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,32,10240,0.008952889177534316
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,65536,16384,0.4049679968092177
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,225,32,3584,0.016368889146380954
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,32,768,0.0034799998005231223
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,65536,16384,0.37069066365559894
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,225,32,32,0.0028071111689011254
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,65536,12288,0.307407988442315
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,65536,51200,1.1394240061442058
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,65536,51200,1.2722053527832031
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,65536,12288,0.27739376491970485
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,65536,10240,0.26604000727335614
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,65536,10240,0.23386666509840223
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,65536,8192,0.2173839939965142
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,65536,8192,0.1881075567669339
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,65536,7168,0.18963111771477592
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,65536,7168,0.1646275520324707
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,65536,6144,0.17240711053212485
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,65536,8192,0.17605688836839464
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,65536,12288,0.2571386761135525
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,65536,10240,0.21323733859592012
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,65536,5120,0.1380293369293213
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,65536,7168,0.15471643871731228
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,65536,4096,0.11296978261735703
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,65536,5120,0.12110400199890137
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,65536,4096,0.10105422470304702
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,65536,6144,0.13644888665941027
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,65536,3584,0.10085688696967231
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,65536,5120,0.11770578225453694
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,65536,4096,0.0999315579732259
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,65536,3072,0.08710577752855088
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,65536,6144,0.14528711636861166
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,65536,3072,0.0784133341577318
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,65536,2560,0.07571999894248115
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,65536,3584,0.09173155493206447
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,65536,2560,0.06894577874077691
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,65536,2048,0.059501330057779946
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,65536,2560,0.07361688878801134
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,65536,2048,0.059472892019483775
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,65536,1536,0.04751555456055535
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,65536,2048,0.06681422392527263
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,65536,1536,0.048413332965638906
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,65536,1024,0.034252444903055825
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,65536,1536,0.05749422311782837
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,65536,768,0.026896889011065166
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,65536,1024,0.03942133320702447
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,65536,1024,0.04896444413397047
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,65536,3584,0.08914044168260361
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,65536,512,0.019524445136388142
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,65536,768,0.03384533193376329
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,65536,256,0.012206222448084088
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,65536,16384,0.3328782187567817
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,65536,512,0.040580444865756564
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,65536,128,0.011016888750924004
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,65536,256,0.03605599866973029
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,65536,512,0.02934933371014065
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,65536,128,0.025058666865030926
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,65536,64,0.009332444104883406
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,65536,128,0.030951112508773804
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,65536,32,0.009951111343171861
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,65536,3072,0.08288266923692492
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,65536,64,0.02437955637772878
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,65536,32,0.030841777722040813
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,65536,768,0.04462577899297079
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,65536,256,0.025768889321221247
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,51200,51200,0.8756444189283582
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,51200,65536,1.119231965806749
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,51200,65536,1.1594906912909615
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,51200,16384,0.2927937772538927
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,51200,12288,0.22099555863274467
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,51200,51200,0.9295351240370008
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,51200,16384,0.3022070990668403
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,65536,51200,1.0722328821818035
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,51200,10240,0.17389510737525093
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,51200,10240,0.19160889254675972
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,51200,8192,0.14487111568450928
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,51200,12288,0.2253742218017578
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,51200,8192,0.1526684496137831
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,51200,7168,0.1244079934226142
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,51200,7168,0.13382132848103842
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,51200,16384,0.28171555201212567
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,51200,6144,0.10780177513758342
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,51200,12288,0.21358577410380045
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,51200,5120,0.09227466583251953
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,51200,6144,0.11744977368248834
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,51200,10240,0.18179644478691948
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,51200,8192,0.1508773300382826
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,51200,4096,0.08146755562888251
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,51200,7168,0.13501600424448648
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,51200,5120,0.09883999824523926
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,51200,3584,0.06651733318964641
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,51200,3584,0.07323733303281996
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,51200,6144,0.12081421746148004
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,51200,5120,0.10418755478329128
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,51200,4096,0.0897573365105523
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,51200,3072,0.05847822295294868
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,51200,2560,0.05213866631189982
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,51200,3584,0.08143555455737643
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,51200,3072,0.0651164452234904
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,51200,2048,0.04125510983996921
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,51200,2560,0.05738133192062378
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,51200,2048,0.05029777685801188
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,51200,2560,0.06645688745710585
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,51200,1536,0.03274666600757175
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,51200,1024,0.024832000335057575
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,51200,2048,0.06041422155168322
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,51200,1536,0.04138222336769104
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,51200,1536,0.05294933252864414
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,51200,1024,0.03365155392222934
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,51200,1024,0.045500444041358105
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,51200,512,0.013119999733236102
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,51200,4096,0.08224088615841336
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,51200,768,0.04134844409094916
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,51200,768,0.028765334023369685
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,51200,256,0.010159999959998662
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,51200,512,0.024932444095611572
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,51200,512,0.037696888049443565
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,51200,128,0.008995555341243744
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,51200,256,0.034006221426857844
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,51200,128,0.027122666438420612
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,51200,64,0.007280000381999546
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,51200,128,0.021669333179791767
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,51200,32,0.007609777980380588
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,51200,64,0.021225778592957392
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,51200,3072,0.07481866412692599
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,51200,32,0.026727999250094097
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,51200,768,0.018983999888102215
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,16384,65536,0.38381867938571507
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,51200,51200,0.8771342171563042
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,16384,65536,0.4457937876383464
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,16384,51200,0.3087120056152344
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,51200,256,0.02296177711751726
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,16384,16384,0.09981866677602132
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,16384,12288,0.07793688774108887
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,16384,51200,0.3518471188015408
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,16384,16384,0.1271253294414944
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,16384,10240,0.06652000215318468
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,51200,65536,1.135544882880317
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,16384,10240,0.07837777667575412
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,16384,16384,0.12826666567060682
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,16384,8192,0.05592444207933214
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,16384,12288,0.10316622257232666
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,16384,12288,0.09070222245322333
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,16384,8192,0.06463111109203763
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,16384,7168,0.04829155405362447
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,16384,6144,0.0415653321478102
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,16384,7168,0.05753599935107761
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,16384,10240,0.09881510999467637
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,16384,8192,0.07841244671079847
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,16384,5120,0.03740266627735562
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,16384,7168,0.0709644423590766
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,16384,4096,0.03050222330623203
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,16384,6144,0.052192889981799655
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,16384,5120,0.0436480012204912
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,16384,6144,0.06526488727993436
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,16384,3584,0.027035555905765955
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,16384,5120,0.05840266413158841
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,16384,4096,0.037648889753553606
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,16384,3072,0.024005333582560223
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,16384,4096,0.05124622252252367
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,16384,65536,0.45938756730821395
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,16384,2560,0.020167110694779288
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,16384,3584,0.04752888944413927
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,16384,2048,0.017151999804708693
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,16384,3072,0.031544887357287936
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,16384,3072,0.0451217790444692
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,16384,1536,0.013626666532622443
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,16384,2560,0.02735022207101186
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,16384,51200,0.3600622283087836
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,16384,2048,0.03853066762288412
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,16384,2048,0.02490933405028449
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,16384,1024,0.010786666638321347
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,16384,768,0.00927022182279163
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,16384,1536,0.02168888847033183
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,16384,1536,0.03729688790109422
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,16384,1024,0.032264000839657254
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,16384,512,0.008290666672918532
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,16384,1024,0.01921866668595208
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,16384,768,0.029489778810077246
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,16384,256,0.0052328887912962176
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,16384,768,0.01750666730933719
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,16384,128,0.004573333180612988
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,16384,512,0.028212444649802312
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,16384,512,0.016170667277442086
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,16384,64,0.004358222087224324
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,16384,256,0.02501511077086131
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,16384,256,0.0151582227812873
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,16384,32,0.004550222307443619
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,16384,128,0.021993777818149988
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,16384,128,0.0147724449634552
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,16384,64,0.014852444330851236
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,16384,32,0.014444443914625378
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,12288,65536,0.2920160028669569
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,12288,51200,0.22853599654303658
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,12288,16384,0.08072621954811944
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,12288,65536,0.37746667861938477
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,16384,3584,0.034289777278900146
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,12288,16384,0.10281333658430312
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,12288,12288,0.060086223814222545
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,16384,2560,0.04134488768047757
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,12288,10240,0.05094933178689745
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,12288,12288,0.07971466912163629
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,12288,8192,0.04238933324813843
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,12288,10240,0.06763555606206258
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,12288,16384,0.12759466965993246
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,12288,12288,0.1020631127887302
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,12288,10240,0.08858578072653876
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,12288,7168,0.03827910953097873
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,12288,8192,0.05739466349283854
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,12288,6144,0.03347644540998671
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,12288,8192,0.07639911439683703
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,12288,7168,0.05248444279034933
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,12288,5120,0.028759999407662287
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,12288,6144,0.04690400097105238
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,12288,7168,0.07035999827914767
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,12288,4096,0.02477688921822442
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,12288,5120,0.03900977638032701
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,12288,51200,0.3505066765679254
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,12288,5120,0.05658311314053006
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,12288,4096,0.03366488880581326
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,12288,3584,0.02146666745344798
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,12288,4096,0.050382223394181996
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,12288,3072,0.01909955508179135
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,12288,51200,0.29558934105767143
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,12288,3584,0.029907554388046265
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,12288,3584,0.04667288727230496
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,12288,65536,0.44613509707980686
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,12288,2560,0.016191111670600045
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,12288,3072,0.02753066685464647
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,12288,3072,0.04394933250215319
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,12288,1536,0.011518222590287527
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,12288,2560,0.0407626661989424
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,12288,2560,0.025018667181332905
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,12288,2048,0.03822044531504313
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,12288,2048,0.022669333550665114
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,12288,1536,0.02018044392267863
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,12288,768,0.008292444050312042
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,12288,1024,0.031327111853493586
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,12288,1024,0.01793955597612593
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,12288,512,0.006579555571079254
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,12288,768,0.02812355425622728
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,12288,768,0.015930665863884818
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,12288,256,0.004942222187916438
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,12288,512,0.015285332997639975
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,12288,512,0.027104000250498455
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,12288,128,0.0042239998777707415
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,12288,256,0.025067556235525344
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,12288,256,0.014092443717850579
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,12288,64,0.004176889028814104
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,12288,6144,0.06439733505249023
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,12288,128,0.013991999957296582
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,12288,128,0.022643556197484333
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,12288,64,0.013767999907334646
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,12288,32,0.014176888598336114
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,10240,65536,0.23424087630377877
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,12288,2048,0.014202665951516895
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,12288,1024,0.009744000103738572
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,10240,51200,0.18933244546254477
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,10240,65536,0.3365795612335205
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,12288,1536,0.035409778356552124
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,10240,16384,0.06429155667622884
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,10240,51200,0.2609315448337131
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,10240,16384,0.09182755814658271
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,10240,12288,0.04957866668701172
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,10240,10240,0.04184622234768338
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,10240,16384,0.12695822450849745
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,10240,12288,0.10097689098782009
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,10240,10240,0.06066489219665527
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,12288,32,0.00423911131090588
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,10240,8192,0.03645066751374139
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,10240,7168,0.03228888909022013
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,10240,10240,0.08802488777372573
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,10240,8192,0.05155822303560045
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,10240,6144,0.027223111854659185
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,10240,8192,0.07522133323881361
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,10240,7168,0.04713866776890225
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,10240,5120,0.023815999428431194
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,10240,7168,0.06957333617740206
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,10240,6144,0.041894220643573336
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,10240,6144,0.06343111064698961
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,10240,4096,0.020111999577946134
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,10240,5120,0.034783111678229436
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,10240,5120,0.0562373333507114
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,10240,3584,0.017549332645204332
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,10240,4096,0.029666665527555678
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,10240,4096,0.04981866810056898
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,10240,3072,0.015436444017622205
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,10240,3584,0.04572000106175741
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,10240,3584,0.027503111296229895
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,10240,2560,0.014044443766276041
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,10240,3072,0.025432889660199482
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,10240,12288,0.0715306666162279
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,10240,2048,0.012196444802814059
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,10240,1536,0.00999466660949919
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,10240,2560,0.03929333223236932
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,10240,2560,0.023315555519527856
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,10240,1024,0.008261333737108443
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,10240,2048,0.037294222248925105
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,10240,2048,0.021172444025675457
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,10240,768,0.0069120000633928515
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,10240,1536,0.03434400094879998
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,10240,1024,0.016586666305859882
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,10240,1024,0.029684444268544514
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,10240,512,0.005560889012283749
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,10240,768,0.027451554934183758
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,10240,256,0.004573333180612988
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,10240,512,0.026624000734753076
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,10240,512,0.014448889427714877
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,10240,128,0.0041911109454101985
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,10240,256,0.013457777599493662
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,10240,256,0.025400888588693406
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,10240,64,0.003834666477309333
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,10240,128,0.013295110729005603
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,10240,65536,0.4447306527031793
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,10240,128,0.021959111094474792
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,10240,32,0.0038746665749284956
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,10240,64,0.013586666848924426
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,10240,32,0.013772444592581855
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,8192,65536,0.20324622260199654
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,8192,65536,0.2891155613793267
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,10240,3072,0.04310844341913859
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,10240,1536,0.018969777557584975
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,8192,51200,0.22450576888190377
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,8192,16384,0.05405333307054308
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,10240,768,0.015472888946533203
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,8192,12288,0.04159733321931627
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,8192,16384,0.08045599857966106
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,8192,16384,0.0947493314743042
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,8192,12288,0.06297689014010958
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,8192,10240,0.035403556293911405
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,10240,51200,0.3468968868255615
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,8192,8192,0.030454221698972914
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,8192,12288,0.0772613353199429
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,8192,51200,0.2415084573957655
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,8192,10240,0.053559998671213783
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,8192,7168,0.0258568889564938
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,8192,10240,0.06713866525226168
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,8192,8192,0.04614488946066963
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,8192,6144,0.022896000080638464
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,8192,8192,0.058687998188866504
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,8192,7168,0.04126844472355313
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,8192,5120,0.01959022217326694
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,8192,51200,0.15146756172180176
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,8192,7168,0.05442133214738634
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,8192,4096,0.016333333320087857
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,8192,6144,0.03666844301753574
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,8192,6144,0.05070399906900194
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,8192,3584,0.014539556370841132
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,8192,5120,0.03147644466824002
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,8192,5120,0.04455555478731791
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,8192,3072,0.013177778157922955
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,8192,4096,0.026945778065257605
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,8192,2560,0.011571555501884885
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,8192,3584,0.025237333443429735
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,8192,3584,0.03808622227774726
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,8192,4096,0.040728890233569674
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,8192,3072,0.02355555527740055
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,8192,2048,0.00997688869635264
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,8192,1536,0.008959111240175035
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,8192,2560,0.034246222840415105
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,8192,2560,0.02146666745344798
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,8192,2048,0.019674667053752475
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,8192,1024,0.0068986668354935115
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,8192,2048,0.03247822324434916
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,8192,1536,0.017140444782045152
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,8192,1536,0.029676444000667993
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,8192,1024,0.02677333354949951
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,8192,1024,0.015491555134455362
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,8192,512,0.0046826667255825466
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,8192,768,0.014475555883513557
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,8192,256,0.00416355538699362
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,8192,512,0.02404622236887614
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,8192,512,0.013947554760509066
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,8192,128,0.003547555456558863
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,8192,65536,0.30742311477661133
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,8192,256,0.013140444126394061
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,8192,256,0.02327644493844774
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,8192,64,0.0034888887570963967
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,8192,32,0.00350577798154619
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,8192,128,0.01276622215906779
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,8192,128,0.021292444732454088
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,8192,64,0.01276622215906779
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,8192,32,0.013815110756291283
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,7168,65536,0.19659645027584502
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,7168,51200,0.14292711681789821
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,7168,65536,0.2848400010002984
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,8192,3072,0.03628888726234436
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,7168,16384,0.05212710963355171
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,7168,51200,0.22198932700686982
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,7168,12288,0.03960444529851278
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,8192,768,0.005668444352017508
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,7168,16384,0.07913688818613689
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,7168,10240,0.034276445706685386
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,7168,16384,0.09354577461878459
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,8192,768,0.025378665990299646
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,7168,8192,0.02868355645073785
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,7168,10240,0.05288088983959622
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,7168,12288,0.0765297810236613
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,7168,7168,0.025056888659795124
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,7168,8192,0.04470577836036682
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,7168,6144,0.021344888541433547
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,7168,65536,0.29992445309956867
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,7168,7168,0.040080888403786555
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,7168,51200,0.23802132076687285
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,7168,7168,0.053688890404171415
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,7168,5120,0.018553778529167175
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,7168,6144,0.035777777433395386
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,7168,6144,0.04946844445334541
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,7168,4096,0.01605955594115787
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,7168,5120,0.04416177670160929
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,7168,3584,0.0140684445699056
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,7168,5120,0.030184000730514526
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,7168,3072,0.012810666528013019
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,7168,4096,0.0403111113442315
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,7168,4096,0.026704889204767015
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,7168,3584,0.037963555918799505
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,7168,2560,0.01145155562294854
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,7168,3584,0.024775111012988623
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,7168,3072,0.03596355517705282
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,7168,3072,0.022960889670583937
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,7168,2048,0.010332444475756751
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,7168,2560,0.03389511174625821
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,7168,1536,0.009020444419648912
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,7168,2048,0.03254222207599216
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,7168,2048,0.018869333797030978
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,7168,1024,0.0069413334131240845
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,7168,1536,0.016756445169448853
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,7168,1536,0.0284862220287323
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,7168,768,0.006219555520349079
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,7168,1024,0.015116444892353482
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,7168,1024,0.02643555568324195
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,7168,512,0.0052844443255000645
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,7168,768,0.014483556151390076
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,7168,768,0.025059555967648823
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,7168,10240,0.06658489174313016
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,7168,256,0.004228444563017951
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,7168,512,0.013656888571050433
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,7168,512,0.02409066590997908
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,7168,128,0.003859555555714501
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,7168,256,0.02366488840844896
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,7168,256,0.013444444371594323
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,7168,64,0.003563555578390757
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,7168,32,0.0035084444615576
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,7168,128,0.012735111018021902
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,7168,64,0.013094222380055321
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,7168,32,0.013410666750537025
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,6144,65536,0.16949955622355142
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,6144,51200,0.13068177964952257
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,7168,2560,0.02092444399992625
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,6144,65536,0.24754489792717826
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,6144,16384,0.0477182235982683
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,7168,12288,0.06202489137649536
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,6144,51200,0.1881413327323066
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,6144,16384,0.07005244493484497
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,6144,12288,0.03767111235194736
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,7168,8192,0.058240003055996366
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,6144,12288,0.054845333099365234
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,6144,16384,0.09224800268809001
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,6144,12288,0.0748986668056912
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,6144,10240,0.030794666873084173
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,6144,8192,0.026127111580636766
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,6144,65536,0.29682932959662545
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,6144,51200,0.23529333538479277
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,7168,128,0.020220445262061227
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,6144,10240,0.04634133312437269
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,6144,7168,0.02335022224320306
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,6144,8192,0.03885866536034478
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,6144,10240,0.06584178076850043
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,6144,6144,0.020190222395790946
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,6144,8192,0.0572648909356859
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,6144,5120,0.017103110750516255
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,6144,7168,0.035100443495644465
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,6144,4096,0.014732443624072604
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,6144,7168,0.0532240006658766
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,6144,6144,0.031898667414983116
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,6144,6144,0.049654222197002836
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,6144,5120,0.043495111995273165
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,6144,5120,0.02716622253259023
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,6144,3072,0.01241422196229299
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,6144,4096,0.04051733348104689
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,6144,4096,0.02437244521247016
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,6144,2560,0.010863111250930362
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,6144,3584,0.037751999166276716
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,6144,3584,0.022672888305452134
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,6144,3072,0.021207999851968553
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,6144,3072,0.03594133257865906
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,6144,1536,0.008265777594513362
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,6144,2560,0.01964000033007728
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,6144,2560,0.033788445923063494
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,6144,2048,0.017278222574128043
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,6144,1024,0.006643555644485686
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,6144,2048,0.032171554035610624
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,6144,1536,0.015838222371207345
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,6144,768,0.005696889013051987
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,6144,1536,0.028592000404993694
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,6144,1024,0.026397332549095154
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,6144,1024,0.014431110686726041
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,6144,512,0.00452533322903845
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,6144,256,0.0038417776425679526
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,6144,768,0.014116444521480136
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,6144,512,0.024294222394625347
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,6144,512,0.013464888764752282
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,6144,128,0.0035093331502543557
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,6144,256,0.012784000072214337
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,6144,256,0.022667555345429316
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,6144,64,0.0034968890249729156
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,6144,32,0.0035013332962989807
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,6144,128,0.01994222237004174
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,6144,128,0.012739555703269111
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,6144,64,0.012429333395428128
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,6144,32,0.013748444616794586
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,5120,65536,0.1467884381612142
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,5120,51200,0.1235111157099406
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,6144,3584,0.013788444300492605
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,5120,16384,0.04319733381271362
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,5120,65536,0.23906132909986708
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,5120,51200,0.18809155623118082
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,5120,12288,0.03382844395107693
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,6144,2048,0.009372444616423713
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,5120,16384,0.06853155295054118
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,5120,16384,0.09094133641984727
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,5120,12288,0.05351288782225715
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,5120,12288,0.07459288835525513
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,5120,10240,0.04454311066203647
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,5120,8192,0.02421422302722931
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,5120,65536,0.29478221469455296
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,5120,10240,0.06503022379345365
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,5120,7168,0.020652444826232064
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,6144,768,0.02439555525779724
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,5120,6144,0.01920088960064782
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,5120,8192,0.03790844480196635
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,5120,7168,0.03445600138770209
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,5120,7168,0.05302933189604017
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,5120,5120,0.016514667206340365
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,5120,6144,0.04907377892070346
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,5120,6144,0.03137777911292182
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,5120,4096,0.013935110635227628
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,5120,5120,0.043559110826916166
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,5120,3584,0.013089777694808112
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,5120,4096,0.023753777146339417
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,5120,4096,0.039339555634392634
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,5120,3072,0.011700444751315646
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,5120,3584,0.0373617774910397
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,5120,3584,0.022279111875428095
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,5120,2560,0.010611555642551847
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,5120,3072,0.02107288936773936
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,5120,3072,0.035671111610200666
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,5120,2048,0.009304888546466827
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,5120,2560,0.03220266766018338
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,5120,2560,0.0188755558596717
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,5120,10240,0.02902311086654663
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,5120,1536,0.007712889048788283
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,5120,2048,0.017529777354664274
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,5120,2048,0.030052443345387776
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,5120,1024,0.006256888724035687
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,5120,1536,0.015442666080262927
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,5120,51200,0.23218488693237305
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,5120,1024,0.014314666390419006
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,5120,1024,0.025585777229732935
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,5120,512,0.004544888933499654
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,5120,8192,0.05685422155592176
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,5120,768,0.0243493335114585
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,5120,768,0.013803555733627744
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,5120,256,0.004105777790149053
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,5120,512,0.013080889152155982
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,5120,512,0.024674667252434626
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,5120,128,0.003822222352027893
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,5120,256,0.022611555125978258
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,5120,256,0.012730666332774691
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,5120,5120,0.027116444375779893
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,5120,64,0.003220444545149803
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,5120,128,0.012434666355450949
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,5120,32,0.0035333335399627686
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,5120,64,0.012705778082211813
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,5120,32,0.012350222302807702
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,4096,65536,0.10965422126981948
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,4096,51200,0.0929937760035197
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,4096,65536,0.20241867171393502
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,4096,16384,0.03760711020893521
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,4096,51200,0.1576871077219645
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,4096,16384,0.05805777841144138
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,5120,1536,0.02826133370399475
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,5120,768,0.0052533331844541765
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,4096,16384,0.0885324411922031
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,4096,10240,0.025389333566029865
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,4096,65536,0.2856275505489773
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,4096,51200,0.2239760027991401
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,4096,12288,0.07209955321417914
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,4096,10240,0.03784266776508755
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,4096,10240,0.06328977478875054
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,4096,7168,0.018789332773950364
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,4096,8192,0.05533688929345873
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,5120,128,0.020225778222084045
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,4096,6144,0.016136000553766888
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,4096,7168,0.02993333339691162
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,4096,7168,0.05150666501786974
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,4096,5120,0.014319111903508505
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,4096,6144,0.0478168891535865
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,4096,6144,0.0277511113219791
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,4096,4096,0.013382222089502545
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,4096,5120,0.023932443724738225
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,4096,5120,0.042484445704354175
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,4096,3584,0.009707555174827576
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,4096,4096,0.02142222225666046
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,4096,4096,0.039093332158194646
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,4096,3072,0.009307555854320526
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,4096,3584,0.020589333441522386
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,4096,3584,0.03614577651023865
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,4096,2560,0.008263111114501953
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,4096,3072,0.018883556127548218
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,4096,3072,0.03457066747877333
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,4096,2048,0.007603555917739868
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,4096,2560,0.03269955515861511
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,4096,2560,0.01720177796151903
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,4096,12288,0.029990222718980577
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,4096,1536,0.006280000011126201
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,4096,1024,0.004927999857399198
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,4096,2048,0.029846221208572388
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,4096,2048,0.015582222077581616
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,4096,12288,0.0441964434252845
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,4096,1536,0.028059555424584284
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,4096,768,0.00453244439429707
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,4096,8192,0.021083555287784998
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,4096,1024,0.025460445218616064
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,4096,1024,0.013471110827393003
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,4096,512,0.003927111211750242
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,4096,256,0.0035333335399627686
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,4096,768,0.013456888496875763
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,4096,512,0.024678222007221643
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,4096,512,0.012720000412729053
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,4096,128,0.003232888877391815
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,4096,256,0.0123857781291008
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,4096,256,0.0236791107389662
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,4096,64,0.0031306667046414483
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,4096,32,0.0032097777972618737
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,4096,128,0.012038222617573209
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,4096,128,0.02014044423898061
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,4096,64,0.012406222522258759
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,3584,65536,0.10012622012032403
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,4096,32,0.01237066669596566
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,3584,51200,0.08073777622646756
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,3584,65536,0.19918578200870088
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,3584,16384,0.033681776788499616
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,3584,51200,0.155114663971795
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,3584,16384,0.05642311440573799
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,3584,16384,0.0881991121504042
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,3584,12288,0.028536889288160536
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,4096,1536,0.014551111393504672
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,3584,65536,0.28404532538519967
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,3584,10240,0.02457155618402693
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,3584,51200,0.22401067945692274
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,3584,12288,0.043841779232025146
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,3584,8192,0.02022133270899455
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,4096,768,0.025016888976097107
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,3584,12288,0.07159022490183513
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,3584,10240,0.037328001525666975
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,4096,8192,0.03284444411595663
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,3584,7168,0.01864355636967553
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,3584,10240,0.06294311417473687
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,3584,6144,0.015818667080667283
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,3584,8192,0.031994667318132185
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,3584,8192,0.05491111013624403
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,3584,7168,0.05119911167356703
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,3584,6144,0.047351999415291675
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,3584,6144,0.027699554959932964
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,3584,4096,0.01124622258875105
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,3584,3584,0.01069866700304879
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,3584,5120,0.023588443795839947
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,3584,5120,0.042318221595552236
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,3584,3072,0.010040889183680216
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,3584,4096,0.03851111067665948
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,3584,4096,0.020942222740915086
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,3584,3584,0.03587999939918518
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,3584,2560,0.00889066689544254
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,3584,3072,0.018357333209779527
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,3584,3072,0.03462844424777561
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,3584,2048,0.007975999679830339
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,3584,2560,0.031034668286641438
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,3584,2560,0.016470222009552848
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,3584,1536,0.006534222099516127
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,3584,2048,0.02918133470747206
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,3584,2048,0.015461333923869662
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,3584,1024,0.005227555417352253
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,3584,1536,0.01441422270403968
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,3584,768,0.00489688871635331
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,3584,1024,0.013528889252079858
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,3584,1024,0.025467554728190105
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,3584,512,0.00443111111720403
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,3584,768,0.01330044451687071
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,3584,768,0.02478666603565216
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,3584,256,0.003552888830502828
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,3584,512,0.012739555703269111
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,3584,512,0.0239991115199195
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,3584,128,0.0032115555885765287
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,3584,256,0.012108444339699216
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,3584,5120,0.014005333185195923
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,3584,7168,0.02960977620548672
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,3584,64,0.003145777723855443
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,3584,128,0.012082666986518435
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,3584,32,0.00315022220214208
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,3584,128,0.019654222660594516
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,3584,64,0.012039110892348819
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,3072,65536,0.08483822478188409
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,3584,32,0.012039110892348819
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,3584,3584,0.019596444235907663
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,3072,51200,0.06587644418080647
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,3072,16384,0.03199288911289639
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,3072,65536,0.1938577757941352
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,3072,51200,0.1521057817671034
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,3072,12288,0.026526222626368206
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,3072,16384,0.05450310972001818
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,3072,16384,0.08773599730597602
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,3072,10240,0.021200888686709937
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,3584,1536,0.028435554769304063
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,3072,12288,0.04245511028501722
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,3072,8192,0.01757777730623881
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,3072,12288,0.07160622543758817
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,3072,10240,0.0627653333875868
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,3072,10240,0.036659555302725896
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,3072,51200,0.22226577334933809
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,3072,7168,0.016361777981122334
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,3072,65536,0.2834560076395671
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,3072,8192,0.031832890378104314
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,3072,6144,0.014354666074117025
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,3072,5120,0.012709333664841123
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,3072,7168,0.02951822347111172
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,3072,7168,0.051164444949891835
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,3072,6144,0.04717688759167989
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,3072,4096,0.010647999743620554
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,3072,6144,0.027134221461084154
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,3072,5120,0.0233271105421914
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,3584,256,0.022685334086418152
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,3072,4096,0.03872977693875631
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,3072,4096,0.020132443971104093
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,3072,3072,0.008663111262851292
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,3072,3584,0.019000000423855253
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,3072,3584,0.03447555502255758
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,3072,2560,0.008289777570300633
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,3072,3072,0.017858665850427415
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,3072,3072,0.033124443557527326
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,3072,2048,0.007584888901975419
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,3072,2560,0.016173332929611206
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,3072,2560,0.030605332718955144
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,3072,1536,0.005882666756709416
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,3072,2048,0.0291244453854031
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,3072,2048,0.01555199921131134
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,3072,1024,0.004548444516128964
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,3072,1536,0.027454222242037456
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,3072,768,0.0041724443435668945
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,3072,1024,0.013803555733627744
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,3072,1024,0.02573777735233307
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,3072,512,0.0038782221575578055
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,3072,768,0.013083555632167392
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,3072,768,0.025213332639800176
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,3072,256,0.003544888976547453
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,3072,512,0.012773333324326409
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,3072,8192,0.05464799867735969
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,3072,512,0.0236835562520557
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,3072,128,0.0031662223239739737
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,3072,256,0.012464889221721225
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,3072,64,0.0029013332807355454
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,3072,128,0.011727111207114326
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,3072,128,0.020562666985723708
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,3072,32,0.003175111073586676
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,3072,5120,0.04226488868395487
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,3072,64,0.012180444267061023
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,2560,65536,0.07380800114737616
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,3072,32,0.012381333443853589
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,2560,51200,0.06026222308476766
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,2560,65536,0.19257067309485543
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,2560,16384,0.02552000019285414
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,2560,51200,0.15074843830532497
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,3072,1536,0.014206222361988492
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,2560,16384,0.05272266599867079
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,2560,12288,0.021928000781271193
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,2560,65536,0.2817182275984022
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,2560,51200,0.22169600592719185
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,2560,10240,0.0195768889453676
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,2560,12288,0.04176355401674906
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,2560,10240,0.03619733452796936
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,2560,8192,0.015279110934999255
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,2560,10240,0.06243999799092611
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,2560,7168,0.013754666679435305
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,3072,256,0.023071999351183575
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,2560,8192,0.054541332854164966
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,2560,8192,0.031552000178231135
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,2560,6144,0.012099555797047086
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,2560,7168,0.029319110843870375
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,3072,3584,0.009651555783218807
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,2560,5120,0.011075555450386472
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,2560,6144,0.026728888352711994
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,2560,6144,0.047170665529039174
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,2560,4096,0.011698666546079846
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,2560,5120,0.04067644476890564
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,2560,5120,0.022521777285469904
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,2560,3584,0.009660444325870937
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,2560,4096,0.020317332612143624
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,2560,4096,0.03634577658441331
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,2560,3072,0.00907199995385276
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,2560,3584,0.018551111221313477
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,2560,3584,0.03454577922821045
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,2560,2560,0.008284444610277811
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,2560,3072,0.01736088924937778
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,2560,2048,0.007265778051482306
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,2560,2560,0.016180444094869826
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,2560,2560,0.03015022145377265
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,2560,16384,0.08682933118608262
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,2560,1536,0.006000888844331105
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,2560,2048,0.015095111396577625
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,2560,2048,0.029519110918045044
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,2560,1024,0.0052675555149714155
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,2560,1536,0.02776177724202474
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,2560,1536,0.014451555079884
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,2560,768,0.004552888787455029
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,2560,1024,0.013777777552604675
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,2560,1024,0.02502577834659153
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,2560,512,0.003916444463862313
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,2560,768,0.025006221400366888
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,2560,768,0.013191999660597907
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,2560,256,0.0035182221068276297
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,2560,512,0.012734221915404001
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,2560,512,0.024382222029897902
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,2560,128,0.003185777821474605
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,2560,256,0.01239111108912362
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,2560,256,0.022294221652878657
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,2560,64,0.003156444471743372
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,2560,128,0.02026844521363576
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,2560,128,0.012062222593360476
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,2560,32,0.002970666728085942
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,2560,64,0.012038222617573209
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,2048,65536,0.05918400155173408
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,2560,32,0.011720889144473605
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,2560,3072,0.032587554719712995
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,2048,51200,0.050385776493284434
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,2048,65536,0.1537084447013007
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,2048,16384,0.022685334086418152
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,2048,51200,0.11730666955312093
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,2560,12288,0.07105777661005656
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,2048,16384,0.042697777350743614
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,2048,65536,0.27926399972703725
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,2048,12288,0.01979377700222863
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,2048,51200,0.2204115523232354
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,2048,16384,0.08637511067920262
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,2048,10240,0.01868799991077847
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,2048,8192,0.0141004439857271
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,2048,10240,0.029855999681684706
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,2048,12288,0.034499555826187134
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,2048,12288,0.0705582234594557
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,2048,8192,0.0265600002474255
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,2048,7168,0.013400000002649097
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,2048,8192,0.05435644586881002
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,2048,6144,0.011811555259757571
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,2560,7168,0.05058222346835666
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,2048,5120,0.01033688916100396
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,2048,7168,0.024732444021436904
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,2048,6144,0.04709066616164314
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,2048,6144,0.022359111242824133
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,2048,4096,0.009309333231714036
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,2048,5120,0.0400257772869534
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,2048,3584,0.008512000242869059
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,2048,5120,0.019547555181715224
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,2048,3072,0.007635555333561367
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,2048,4096,0.036102222071753606
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,2048,4096,0.017871111631393433
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,2048,2560,0.006968888971540663
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,2048,3584,0.034259554412629865
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,2048,3584,0.016547555724779766
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,2048,2048,0.006173333360089197
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,2048,3072,0.032553778754340276
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,2048,2560,0.029680000411139593
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,2048,2560,0.014803555276658801
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,2048,1536,0.005260444349712796
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,2048,2048,0.014075555735164218
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,2048,2048,0.028772443532943726
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,2048,1024,0.0041991112132867174
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,2048,1536,0.013702222042613559
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,2048,1536,0.027300443914201524
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,2048,768,0.0041857775714662345
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,2048,1024,0.025370667378107708
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,2048,512,0.003826666623353958
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,2048,768,0.025262221693992615
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,2048,768,0.012478222449620565
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,2048,256,0.003257777748836411
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,2048,512,0.01238844460911221
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,2048,512,0.025008888708220586
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,2048,10240,0.06163555383682251
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,2048,128,0.0032248888164758682
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,2048,256,0.011709333293967776
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,2048,64,0.00313688897424274
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,2048,128,0.011711111499203576
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,2048,128,0.02069422271516588
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,2048,7168,0.050629334317313306
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,2048,32,0.003173333282272021
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,1536,65536,0.04761688907941183
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,2048,64,0.011704000333944956
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,2048,32,0.01205244412024816
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,1536,51200,0.04122489028506809
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,1536,65536,0.15008621745639378
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,2048,3072,0.015789333317014907
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,1536,16384,0.01852799952030182
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,1536,51200,0.11768889427185059
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,1536,12288,0.0162426663769616
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,1536,16384,0.04182755615976122
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,1536,16384,0.08573333422342937
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,1536,65536,0.27809511290656197
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,1536,51200,0.21978488233354357
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,1536,10240,0.014944000376595391
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,1536,12288,0.03394488824738397
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,2048,1024,0.012784000072214337
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,1536,12288,0.06987111435996161
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,1536,10240,0.06153421931796604
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,1536,7168,0.01424800025092231
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,1536,10240,0.029849777619043987
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,1536,6144,0.011396444506115384
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,1536,8192,0.0535715553495619
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,1536,7168,0.04979022343953451
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,1536,7168,0.02392622166209751
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,1536,5120,0.010236444572607676
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,1536,6144,0.022257778379652236
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,1536,6144,0.04531200064553154
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,2048,256,0.02296177711751726
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,1536,4096,0.008513777620262569
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,1536,5120,0.018920888503392536
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,1536,5120,0.04115822248988681
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,1536,3584,0.007975111405054728
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,1536,4096,0.03595733311441209
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,1536,4096,0.017097777790493436
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,1536,3072,0.006993778049945831
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,1536,3584,0.016466667254765827
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,1536,3584,0.03358755509058634
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,1536,2560,0.0070675553547011475
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,1536,3072,0.015492444237073263
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,1536,3072,0.03208622336387634
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,1536,2048,0.006604444649484422
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,1536,2560,0.014482667048772177
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,1536,2560,0.029890666405359905
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,1536,1536,0.005903999838564131
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,1536,2048,0.013766222529941134
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,1536,1024,0.004924444274769889
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,1536,1536,0.013428444663683573
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,1536,8192,0.014130666851997375
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,1536,1024,0.012416000167528788
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,1536,1024,0.025703110628657874
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,1536,768,0.004238222208287981
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,1536,512,0.003847111016511917
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,1536,768,0.024774221910370722
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,1536,8192,0.02605244517326355
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,1536,768,0.012404444317022959
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,1536,256,0.0035173334181308746
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,1536,512,0.012103999654452005
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,1536,128,0.003175111073586676
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,1536,512,0.02398577829202016
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,1536,256,0.011767110890812345
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,1536,256,0.023316444622145757
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,1536,64,0.0029351111087534162
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,1536,32,0.002871111035346985
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,1536,128,0.020233778489960563
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,1536,128,0.01148088855875863
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,1024,65536,0.03791022300720215
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,1536,64,0.011745777395036487
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,1536,32,0.011400000088744693
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,1024,51200,0.030020445585250854
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,1024,65536,0.1476586659749349
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,1024,16384,0.015798222687509324
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,1024,51200,0.11335110664367676
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,1536,2048,0.028559111886554297
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,1024,12288,0.013448889056841532
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,1024,51200,0.2188133398691813
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,1024,65536,0.2770933310190837
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,1024,16384,0.041286223464541964
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,1024,10240,0.013054221868515015
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,1536,1536,0.027098667290475633
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,1024,16384,0.08532088994979858
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,1024,8192,0.012489777472284106
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,1024,7168,0.011403555671374003
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,1024,12288,0.06993333498636882
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,1024,12288,0.03348088926739163
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,1024,10240,0.06127466758092245
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,1024,6144,0.011058666639857821
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,1024,8192,0.05332888828383552
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,1024,5120,0.009719111025333405
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,1024,7168,0.023207111491097346
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,1024,6144,0.04449866546524895
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,1024,6144,0.021292444732454088
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,1024,4096,0.008995555341243744
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,1024,5120,0.03926488757133484
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,1024,5120,0.018933332628673978
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,1024,3584,0.008296888735559251
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,1024,4096,0.03573688864707947
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,1024,4096,0.016894222961531747
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,1024,3072,0.007737778127193451
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,1024,3584,0.01642311116059621
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,1024,3584,0.03360533383157518
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,1024,2560,0.006603555546866522
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,1024,3072,0.03193599979082743
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,1024,2048,0.006224888894293044
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,1024,2560,0.01455200049612257
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,1024,2560,0.029926220575968426
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,1024,1536,0.0052435555391841466
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,1024,2048,0.013693333499961428
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,1024,2048,0.028778665595584448
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,1024,1024,0.0041911109454101985
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,1024,1536,0.013433777623706393
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,1024,1536,0.027083555857340496
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,1024,768,0.0038417776425679526
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,1024,1024,0.012777778009573618
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,1024,1024,0.025387555360794067
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,1024,512,0.003504000190231535
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,1024,768,0.012107555237081317
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,1024,768,0.025055999557177227
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,1024,256,0.003169777699642711
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,1024,512,0.012216889195972018
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,1024,7168,0.04960088928540548
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,1024,128,0.0028204443968004654
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,1024,256,0.01202755586968528
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,1024,256,0.0229759994480345
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,1024,64,0.0028577778074476454
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,1024,128,0.011713777979214987
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,1024,128,0.020629333125220407
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,1024,32,0.0028613333900769553
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,1024,64,0.011075555450386472
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,1024,3072,0.015464888678656684
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,1024,32,0.011711999773979187
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,768,65536,0.033202668031056724
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,768,51200,0.027127110295825537
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,768,65536,0.14602488941616482
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,768,51200,0.11391822497049968
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,768,16384,0.0188755558596717
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,768,65536,0.27818844053480357
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,768,51200,0.21967377927568224
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,768,16384,0.08529333273569743
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,1024,10240,0.0288080010149214
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,768,12288,0.01460977726512485
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,1024,8192,0.02534488836924235
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,768,10240,0.013806222213639153
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,1024,512,0.023677332533730402
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,768,8192,0.012053333222866058
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,768,12288,0.0696106685532464
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,768,10240,0.06086577971776327
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,768,10240,0.02846577763557434
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,768,7168,0.011419555379284753
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,768,8192,0.02490844494766659
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,768,8192,0.053299556175867714
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,768,6144,0.010440888504187265
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,768,7168,0.023000000251664057
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,768,5120,0.009773333039548662
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,768,6144,0.04490400022930569
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,768,6144,0.02107644412252638
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,768,4096,0.007974222302436829
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,768,5120,0.039136889908048846
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,768,5120,0.018589332699775696
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,768,3584,0.007150222029950883
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,768,4096,0.01682577696111467
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,768,4096,0.03587733374701606
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,768,3072,0.006559999866618051
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,768,3584,0.016307555966907077
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,768,3584,0.0335822237862481
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,768,2560,0.005943111247486538
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,768,3072,0.015486222174432544
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,768,3072,0.03184444374508328
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,768,2048,0.0052177777720822235
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,768,2560,0.01443377799457974
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,768,1536,0.004916444420814514
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,768,2048,0.013584888643688627
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,768,16384,0.04009600149260627
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,768,1024,0.004226666771703296
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,768,1536,0.013082666529549493
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,768,1536,0.026753778258959453
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,768,768,0.003920000046491623
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,768,12288,0.03299199872546726
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,768,1024,0.024714666936132643
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,768,1024,0.01239822225438224
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,768,512,0.003510222252872255
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,768,768,0.012150222228633033
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,768,768,0.025072889195548162
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,768,256,0.0032808888289663526
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,768,512,0.01203555530971951
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,768,512,0.023317333724763658
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,768,128,0.003169777699642711
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,768,7168,0.04777955677774218
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,768,256,0.022614222433831956
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,768,64,0.0029208889851967492
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,768,256,0.011757333245542316
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,768,32,0.00286311118139161
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,768,128,0.011405333048767514
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,768,128,0.01961688862906562
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,512,65536,0.02410488824049632
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,768,64,0.011431111229790581
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,768,32,0.011763555308183035
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,512,65536,0.14516977469126383
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,512,51200,0.11146044731140137
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,512,65536,0.27686044904920787
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,768,2560,0.029834667841593426
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,512,12288,0.014183999763594734
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,512,16384,0.03968711031807794
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,768,2048,0.02882222334543864
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,512,16384,0.08449955781300862
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,512,10240,0.012415111064910889
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,512,12288,0.0322364436255561
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,512,8192,0.011362666885058085
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,512,10240,0.027443556321991816
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,512,10240,0.06052888764275444
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,512,7168,0.010680889089902243
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,512,8192,0.024131556351979572
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,512,8192,0.0507226652569241
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,512,6144,0.01020088874631458
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,512,7168,0.04740800129042732
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,512,7168,0.02251911163330078
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,512,5120,0.008970666262838576
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,512,6144,0.020956445071432326
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,512,6144,0.043875555197397866
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,512,4096,0.00832088871134652
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,512,5120,0.018567999203999836
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,512,5120,0.0391226675775316
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,512,3584,0.006945778098371293
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,512,51200,0.01978933314482371
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,512,4096,0.03529955612288581
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,512,3072,0.006309333360857434
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,512,4096,0.01720533271630605
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,512,3584,0.016169778174824186
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,512,3584,0.03361422154638503
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,512,2560,0.005943111247486538
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,512,3072,0.03194488750563727
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,512,3072,0.015450666348139444
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,512,16384,0.01204177737236023
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,512,2048,0.005572444448868434
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,512,1536,0.0048942222363419
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,512,2560,0.014482667048772177
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,512,2560,0.029842668109469946
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,512,51200,0.21932266818152535
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,512,1024,0.004168888760937585
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,512,2048,0.02849600050184462
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,512,2048,0.013579555683665805
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,512,768,0.0038613333470291565
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,512,1536,0.027801778581407335
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,512,1536,0.013448889056841532
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,512,512,0.00349866681628757
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,512,1024,0.01274311128589842
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,512,1024,0.025097777446111042
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,512,256,0.003206222214632564
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,512,768,0.012131555212868584
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,512,768,0.023981332778930664
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,512,128,0.0028728888266616394
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,512,512,0.02368800010946062
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,512,512,0.012226666841242047
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,512,12288,0.0690844456354777
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,512,64,0.00281866660548581
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,512,256,0.011716444459226398
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,512,32,0.002814222127199173
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,256,65536,0.02180533276663886
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,512,128,0.01959466603067186
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,256,51200,0.01949155496226417
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,512,64,0.011750222080283694
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,512,32,0.011717333561844297
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,256,16384,0.010379555324713389
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,256,65536,0.13998133606380886
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,256,51200,0.11069955428441365
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,256,65536,0.27686044904920787
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,256,16384,0.039459556341171265
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,256,12288,0.00997511131895913
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,256,51200,0.21922222773234049
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,256,16384,0.08380533589257134
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,256,12288,0.06760978036456637
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,256,12288,0.03115733464558919
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,256,10240,0.027463111612531874
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,256,8192,0.008615111311276754
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,256,10240,0.058782219886779785
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,256,7168,0.00795377790927887
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,256,8192,0.02409422232045068
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,256,8192,0.051141334904564746
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,256,7168,0.022963555322753057
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,256,7168,0.04724533359209696
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,256,6144,0.007616889145639207
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,256,5120,0.008291555775536431
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,256,6144,0.020941333638297185
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,256,4096,0.007599111232492659
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,512,256,0.023618666662110224
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,256,4096,0.01717511150572035
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,512,128,0.011374221907721626
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,256,3584,0.006962666908899943
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,256,4096,0.036064889695909284
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,256,3072,0.006474666711356904
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,256,3584,0.015809777710172866
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,256,3072,0.015450666348139444
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,256,10240,0.009305777649084726
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,256,2560,0.005877333382765452
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,256,2560,0.030219554901123047
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,256,2560,0.014156444205178155
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,256,2048,0.0052871112194326185
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,256,2048,0.013405332962671915
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,256,1536,0.00463377767139011
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,256,6144,0.04351822204060025
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,256,5120,0.03901866740650601
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,256,1536,0.013088888592190213
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,256,1024,0.003842666745185852
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,256,1536,0.02683111031850179
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,256,768,0.003549333247873518
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,256,1024,0.02574133376280467
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,256,1024,0.012402666939629449
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,256,512,0.0031600000543726813
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,256,768,0.012051555845472546
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,256,768,0.024668445189793903
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,256,256,0.003181333343187968
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,256,3584,0.03392088744375441
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,256,512,0.01202222208182017
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,256,512,0.023657777243190344
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,256,128,0.0028133332315418455
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,256,256,0.011710222396585675
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,256,3072,0.031459556685553655
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,256,64,0.002809777855873108
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,256,128,0.01956888867749108
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,256,32,0.0028151110228565005
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,256,128,0.011376000112957425
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,128,65536,0.016346666547987197
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,256,64,0.011383111278216044
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,256,32,0.011133333047231039
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,128,51200,0.014567111929257711
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,128,65536,0.1421120034323798
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,256,2048,0.028841776980294123
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,128,65536,0.2774435679117839
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,128,51200,0.10911999808417426
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,128,16384,0.009663999908500248
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,128,12288,0.008349333372380998
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,256,5120,0.018371555540296767
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,128,51200,0.21817955705854628
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,128,16384,0.03865955604447259
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,128,10240,0.00904177791542477
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,128,12288,0.03122755553987291
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,128,8192,0.00834222220712238
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,128,12288,0.06658399767345853
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,128,10240,0.058555556668175586
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,128,7168,0.00795022232664956
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,128,8192,0.05051733387841118
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,128,7168,0.022015111313925848
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,128,7168,0.04671733246909248
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,128,6144,0.0073831114504072405
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,256,256,0.023013333479563396
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,128,5120,0.008023111356629265
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,128,6144,0.04367466767628988
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,128,6144,0.02057422200838725
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,128,4096,0.007305777735180325
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,128,5120,0.018561777141359117
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,128,5120,0.03899733225504557
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,128,4096,0.01648533344268799
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,128,4096,0.0353724459807078
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,128,3072,0.006707555717892117
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,128,3584,0.015816888875431485
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,128,3584,0.03308711118168301
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,128,2560,0.00655733338660664
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,128,3072,0.03156266609827677
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,128,16384,0.08234666453467475
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,128,2048,0.006246222390068903
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,128,2560,0.014067555467287699
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,128,2560,0.029800001117918227
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,128,1536,0.004528000122971005
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,128,10240,0.027464888162083093
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,128,2048,0.02843911117977566
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,128,2048,0.013421333498424955
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,128,1024,0.0038924444880750445
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,128,8192,0.023863111933072407
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,128,1536,0.0127697777416971
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,128,1536,0.027412444353103638
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,128,1024,0.012401777837011548
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,128,1024,0.025052444802390203
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,128,512,0.003170666595300039
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,128,768,0.024720888998773363
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,128,768,0.01181688904762268
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,128,256,0.0028479999552170434
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,128,512,0.011731555892361535
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,128,512,0.02370044423474206
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,128,128,0.0025600000388092464
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,128,256,0.011369778050316704
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,128,64,0.0025271111064487034
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,128,128,0.011056889262464313
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,128,128,0.019312888383865356
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,128,3584,0.007311111523045435
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,128,32,0.0028231110837724474
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,64,65536,0.014117333624098035
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,128,64,0.011015999648306104
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,64,51200,0.012874667015340594
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,128,32,0.011020444333553314
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,64,65536,0.14273866017659506
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,64,51200,0.10897244347466363
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,64,12288,0.008276444342401292
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,64,16384,0.03758577836884393
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,64,10240,0.007653333246707916
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,64,8192,0.007257777783605788
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,64,12288,0.03088266650835673
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,64,10240,0.027111111415757075
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,64,7168,0.006934222247865465
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,64,8192,0.02366133365366194
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,64,6144,0.006574222197135289
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,64,5120,0.005956444475385878
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,128,768,0.003573333223660787
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,64,7168,0.02199111051029629
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,64,4096,0.006591111007663939
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,64,6144,0.020617778102556866
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,64,3584,0.006524444454246097
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,64,5120,0.018215111560291715
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,64,3072,0.005946666830115848
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,64,2560,0.006601777755551868
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,64,4096,0.016207110550668504
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,64,2048,0.005950222412745158
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,64,3072,0.015133332875039844
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,224,128,256,0.0226275556617313
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,64,2560,0.01439377831088172
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,64,1536,0.00453599997692638
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,64,1024,0.003847111016511917
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,64,2048,0.013251555462678274
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,64,1536,0.01293333371480306
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,64,1024,0.012730666332774691
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,64,768,0.012055111428101858
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,64,16384,0.009664889011118147
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,64,256,0.0028435554769304064
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,64,128,0.0028640000770489373
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,64,512,0.01204177737236023
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,128,3072,0.01484444406297472
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,64,64,0.0028328889360030494
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,64,256,0.012079111403889127
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,64,32,0.0024906665914588505
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,64,128,0.01107911103301578
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,32,65536,0.014056000444624158
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,64,64,0.011702222128709158
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,32,51200,0.012392889294359418
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,64,32,0.011401777466138205
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,32,16384,0.009002666506502364
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,32,65536,0.14133511649237737
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,32,12288,0.007811555431948767
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,32,16384,0.03879288832346598
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,32,10240,0.0074542222751511475
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,32,12288,0.030753778086768255
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,64,3584,0.015847999188635085
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,32,8192,0.00700800038046307
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,32,7168,0.006909333169460297
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,32,10240,0.02748888896571265
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,32,6144,0.006383111079533895
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,64,768,0.0035128887328836652
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,32,8192,0.0237137774626414
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,32,5120,0.006247111078765657
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,32,7168,0.02199733257293701
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,32,4096,0.005964444329341252
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,64,512,0.0034728890491856467
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,32,3584,0.006250666661394968
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,32,3072,0.006235555642180973
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,32,5120,0.018254222141371835
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,32,4096,0.016169778174824186
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,32,3584,0.01585244470172458
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,32,3072,0.015127110812399121
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,32,1536,0.004541333350870344
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,32,2560,0.013829333086808523
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,32,1024,0.0038480001191298165
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,32,2048,0.013413333230548434
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,32,768,0.0035048888789282907
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,32,1536,0.012723555167516073
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,32,512,0.003265777809752358
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,32,1024,0.012431999875439538
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,32,256,0.0028284444577164124
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,32,768,0.012215110990736218
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,32,128,0.002814222127199173
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,32,512,0.011713777979214987
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,32,51200,0.10663733217451309
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,32,64,0.0028231110837724474
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,32,256,0.011360888679822287
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,32,32,0.0025173332542181015
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,32,128,0.011365333365069495
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,32,64,0.011712888876597086
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,32,32,0.011038222246699862
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,224,32,6144,0.020831111404630873
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,32,2560,0.006256000035338932
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,65536,16384,0.39595821168687606
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,65536,16384,0.36408087942335343
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,65536,12288,0.30342311329311794
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,65536,10240,0.24557333522372773
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,65536,10240,0.2286142243279351
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,65536,8192,0.20305955410003662
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,65536,51200,1.1073111428154838
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,65536,7168,0.17636088530222574
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,65536,51200,1.2477519777086046
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,65536,8192,0.18525777922736275
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,65536,6144,0.15169155597686768
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,65536,5120,0.13167556126912436
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,65536,7168,0.16135199864705405
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,65536,6144,0.14112533463372126
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,65536,3584,0.09947288698620266
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,65536,4096,0.1076364450984531
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,65536,3072,0.08697155449125503
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,224,32,2048,0.005947555518812603
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,65536,2560,0.07217244307200114
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,65536,3584,0.08882666958702935
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,65536,3072,0.07722310887442695
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,65536,4096,0.10116977824105157
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,65536,2560,0.06875377893447876
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,65536,2048,0.058851553334130176
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,65536,1024,0.033391998873816595
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,65536,1536,0.04284800092379252
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,65536,12288,0.26899467574225533
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,65536,768,0.025388444463411968
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,65536,512,0.018593778212865193
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,65536,1536,0.04822488956981235
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,65536,256,0.01312888910373052
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,65536,512,0.03311555584271749
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,65536,768,0.03388444582621256
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,65536,128,0.010625777973069085
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,65536,256,0.025780444343884785
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,65536,1024,0.03907555672857497
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,65536,64,0.00831822223133511
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,65536,128,0.024622221787770588
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,65536,64,0.024060444699393377
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,65536,32,0.0243511117166943
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,65536,5120,0.11927110619015163
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,51200,16384,0.32552001211378306
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,65536,2048,0.058803558349609375
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,51200,12288,0.2458195686340332
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,51200,16384,0.29048000441657174
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,51200,12288,0.21528177791171602
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,51200,51200,0.9094088872273763
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,51200,51200,1.0044897927178276
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,51200,10240,0.19959378242492676
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,65536,32,0.008559111091825698
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,51200,65536,1.1469199922349718
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,51200,65536,1.2865751054551866
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,51200,10240,0.18338310718536377
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,51200,8192,0.15149866210089788
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,51200,6144,0.12797599368625218
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,51200,7168,0.1322880056169298
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,51200,7168,0.14351733525594076
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,51200,4096,0.08725688854853313
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,51200,5120,0.0969582200050354
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,51200,3584,0.07579377624723646
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,51200,4096,0.0815991097026401
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,51200,3584,0.07269866598976983
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,51200,6144,0.11585599846310085
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,51200,2560,0.05556533071729872
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,51200,3072,0.06600711080763075
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,51200,3072,0.06380622254477607
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,51200,2560,0.056623107857174344
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,51200,1536,0.03594577643606398
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,51200,1024,0.026696888936890498
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,51200,768,0.020598222812016804
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,51200,2048,0.0491466654671563
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,51200,1536,0.0410426656405131
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,51200,512,0.01479822231663598
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,51200,256,0.01072266697883606
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,51200,1024,0.03358666764365302
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,51200,128,0.008970666262838576
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,51200,256,0.022954665952258643
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,51200,512,0.027278222971492346
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,51200,64,0.007268444531493717
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,51200,128,0.021597334080272253
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,51200,32,0.007271111011505127
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,51200,5120,0.10468622048695882
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,51200,64,0.02161600026819441
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,51200,32,0.021280889709790547
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,16384,65536,0.3754417896270752
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,16384,51200,0.2968897819519043
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,16384,16384,0.0983733336130778
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,51200,2048,0.04589688777923584
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,16384,51200,0.341248008939955
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,16384,65536,0.4317759937710232
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,16384,10240,0.06332000096638997
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,16384,12288,0.07522488964928521
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,16384,12288,0.08733422226376003
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,16384,16384,0.11410044299231635
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,16384,8192,0.05317777726385328
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,16384,10240,0.07466044690873888
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,16384,7168,0.04665333363744947
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,16384,6144,0.040037333965301514
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,51200,8192,0.1649279991785685
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,16384,8192,0.06407822502983941
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,16384,5120,0.035028444396124944
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,16384,7168,0.057051552666558154
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,16384,4096,0.030096001095241968
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,51200,768,0.02864711152182685
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,16384,3072,0.023031110564867657
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,16384,4096,0.03722133239110311
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,16384,2560,0.0192239996459749
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,16384,6144,0.04840888910823398
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,16384,5120,0.04236977630191379
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,16384,3072,0.030305776331159804
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,16384,1536,0.013059555656380124
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,16384,1024,0.01020088874631458
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,16384,2560,0.027437332603666518
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,16384,2048,0.02423022190729777
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,16384,1536,0.02148888839615716
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,16384,768,0.008828444613350762
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,16384,512,0.007349333001507654
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,16384,1024,0.01888533267709944
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,16384,768,0.017503110898865592
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,16384,512,0.017509332961506315
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,16384,128,0.004547555413511065
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,16384,256,0.015127110812399121
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,16384,128,0.014505777094099255
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,16384,32,0.0041955556306574075
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,16384,64,0.014504000544548035
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,16384,32,0.01575911045074463
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,12288,65536,0.29174666934543186
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,16384,3584,0.026191110412279766
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,16384,3584,0.03406755460633172
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,12288,65536,0.35937245686848956
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,16384,2048,0.016336888074874878
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,12288,16384,0.07613333066304524
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,12288,12288,0.060277336173587374
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,12288,51200,0.2835786607530382
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,16384,256,0.005256888767083486
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,12288,16384,0.09912977615992229
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,12288,12288,0.07636266946792603
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,12288,8192,0.042895999219682485
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,12288,7168,0.03729688790109422
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,16384,64,0.004250666747490565
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,12288,6144,0.03273866573969523
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,12288,8192,0.056800888644324414
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,12288,10240,0.06557333469390869
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,12288,7168,0.05105333195792305
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,12288,5120,0.02825777729352315
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,12288,4096,0.02442933287885454
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,12288,3584,0.021270222134060327
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,12288,6144,0.04323110977808634
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,12288,3072,0.019055111540688407
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,12288,5120,0.0379342238108317
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,12288,4096,0.03239911132388645
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,12288,2560,0.015830222103330824
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,12288,3584,0.030072887738545735
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,12288,3072,0.027181333965725366
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,12288,1536,0.011587555209795633
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,12288,2560,0.024700444605615404
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,12288,2048,0.02215822206603156
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,12288,1024,0.00965244405799442
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,12288,768,0.00832088871134652
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,12288,1536,0.020184000333150227
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,12288,512,0.006605333338181178
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,12288,1024,0.017663111289342243
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,12288,768,0.016188444362746347
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,12288,51200,0.22745688756306967
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,12288,256,0.005203555441564984
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,12288,512,0.015816888875431485
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,12288,128,0.004535111288229625
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,12288,64,0.003912888881233004
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,12288,256,0.014136888914638095
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,12288,128,0.0138568886452251
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,12288,32,0.0041831110914548235
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,12288,32,0.013471999930010902
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,12288,64,0.013779555757840475
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,10240,51200,0.20597778426276314
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,10240,16384,0.07269422213236491
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,10240,65536,0.2633662223815918
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,10240,12288,0.0565626687473721
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,10240,65536,0.3187217712402344
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,10240,10240,0.049175110128190785
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,10240,51200,0.25047556559244794
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,10240,16384,0.0885573360655043
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,12288,2048,0.013722666435771518
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,10240,12288,0.06799733638763428
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,10240,10240,0.05908089213901096
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,10240,7168,0.03973599937227037
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,10240,6144,0.03340177734692892
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,10240,5120,0.027948445743984644
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,10240,4096,0.02381333377626207
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,10240,7168,0.04579200016127693
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,10240,6144,0.03886133432388306
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,10240,5120,0.03417866759830051
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,10240,3584,0.021186666356192693
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,10240,3072,0.018464888135592144
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,10240,2560,0.016235555211702984
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,10240,3584,0.0273635552989112
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,10240,2048,0.014367111855083041
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,10240,3072,0.025016888976097107
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,10240,2560,0.022989332675933838
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,10240,1536,0.01202311118443807
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,12288,10240,0.05017866690953573
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,10240,1024,0.009233777721722921
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,10240,768,0.0076142218377855085
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,10240,2048,0.020986666282018025
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,10240,1536,0.018582221534517076
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,10240,512,0.005933333188295364
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,10240,256,0.004866666677925321
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,10240,1024,0.01651822196112739
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,10240,768,0.015448000695970325
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,10240,128,0.004234666625658671
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,10240,64,0.003916444463862313
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,10240,512,0.015489778584904142
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,10240,256,0.013757333159446716
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,10240,32,0.004018666843573253
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,10240,64,0.013452444639470843
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,10240,32,0.01519466605451372
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,10240,8192,0.04070666763517592
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,8192,65536,0.22246487935384116
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,10240,8192,0.050993776983684964
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,8192,16384,0.058697779973347984
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,8192,65536,0.27166223526000977
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,8192,12288,0.04580977890226576
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,10240,4096,0.03018222252527873
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,8192,51200,0.21654755539364287
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,8192,10240,0.03857422206136916
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,8192,8192,0.03273066547181871
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,8192,7168,0.028505778974956934
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,8192,12288,0.059976001580556236
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,8192,8192,0.04480444391568502
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,8192,6144,0.02532800038655599
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,8192,5120,0.021864000293943617
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,8192,7168,0.03997777899106344
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,8192,6144,0.03433155682351854
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,8192,3584,0.015835555063353646
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,8192,5120,0.030185778935750324
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,8192,4096,0.026335999369621277
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,10240,128,0.01312888910373052
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,8192,3584,0.02461244497034285
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,8192,2560,0.012351999680201212
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,8192,2048,0.010674667027261523
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,8192,3072,0.022950222094853718
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,8192,1536,0.009203555683294931
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,8192,2048,0.019311111834314134
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,8192,1024,0.007257777783605788
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,8192,51200,0.17333689000871447
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,8192,768,0.00601244428091579
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,8192,1536,0.01717333330048455
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,8192,512,0.004899555610285865
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,8192,1024,0.015170666906568738
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,8192,768,0.014870221416155497
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,8192,256,0.004081777814361784
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,8192,512,0.014450665977266101
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,8192,128,0.0038497779104444715
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,8192,10240,0.052744001150131226
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,8192,256,0.013125333521101209
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,8192,64,0.0034968890249729156
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,8192,32,0.003543111185232798
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,8192,128,0.012792888614866467
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,8192,4096,0.01850488947497474
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,8192,64,0.013122667041089801
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,8192,32,0.013090666797426013
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,7168,65536,0.20746044317881265
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,8192,3072,0.014462222655614218
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,7168,16384,0.05554844604598152
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,7168,51200,0.1624177826775445
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,7168,65536,0.2686844401889377
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,7168,51200,0.21225867006513807
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,7168,16384,0.07558044460084704
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,7168,10240,0.03692355420854356
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,8192,2560,0.021329777108298406
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,7168,12288,0.05902666515774197
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,7168,8192,0.031195554468366835
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,7168,7168,0.02722666660944621
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,7168,6144,0.02402399977048238
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,7168,10240,0.051629334688186646
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,7168,8192,0.043354666895336576
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,7168,5120,0.02071644365787506
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,7168,7168,0.03872799873352051
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,7168,4096,0.017550221747822232
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,8192,16384,0.07653422488106622
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,7168,3584,0.015287111202875773
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,7168,6144,0.03298222356372409
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,7168,2560,0.012016889121797351
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,7168,3072,0.013659555878904132
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,7168,4096,0.026183111800087824
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,7168,2048,0.010752889017264048
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,7168,3584,0.024417777856190998
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,7168,1536,0.008712000317043727
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,7168,1024,0.006913777854707506
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,7168,2560,0.020845333735148113
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,7168,768,0.005787555542257097
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,7168,2048,0.018930666976504855
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,7168,512,0.00490399988161193
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,7168,1536,0.016543111867374845
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,7168,1024,0.015059555570284525
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,7168,256,0.0041955556306574075
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,7168,128,0.003830222205983268
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,7168,768,0.01482311056719886
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,7168,64,0.003543111185232798
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,7168,512,0.014480888843536377
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,7168,256,0.013071999781661563
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,7168,32,0.003530666646030214
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,7168,128,0.012776888906955719
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,7168,64,0.01278133359220293
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,7168,32,0.012728888955381183
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,6144,65536,0.1734639936023288
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,7168,12288,0.04342933495839437
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,6144,16384,0.0518124434683058
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,6144,51200,0.13913688394758436
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,6144,65536,0.23138843642340767
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,6144,12288,0.042246222496032715
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,6144,10240,0.03545244534810384
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,6144,51200,0.18193422423468697
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,6144,16384,0.06624444325764973
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,6144,8192,0.029584887954923842
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,6144,12288,0.05166133244832357
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,6144,7168,0.026383111874262493
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,6144,10240,0.04520000020662943
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,6144,6144,0.02307111190425025
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,6144,8192,0.03778577844301859
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,7168,5120,0.029155555698606703
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,6144,7168,0.03425688876046075
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,6144,4096,0.016167999969588388
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,6144,6144,0.029327111111746892
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,7168,3072,0.022587555978033278
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,6144,3584,0.015103111664454142
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,6144,5120,0.02622311148378584
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,6144,3072,0.013345777988433838
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,6144,2560,0.012056888805495368
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,6144,4096,0.023353776997990076
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,6144,2048,0.01034577770365609
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,6144,3584,0.02199111051029629
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,6144,1536,0.00866844422287411
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,6144,1024,0.0069057775868309875
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,6144,3072,0.02092711130777995
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,6144,2560,0.0192577772670322
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,6144,768,0.005936000082227919
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,6144,2048,0.017102221647898357
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,6144,512,0.004854222138722737
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,6144,256,0.003887999802827835
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,6144,128,0.0034862222770849862
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,6144,1024,0.014429334137174817
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,6144,768,0.01427288850148519
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,6144,512,0.013819555441538492
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,6144,256,0.013070222404268054
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,6144,64,0.0032195556494924757
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,6144,32,0.003532444437344869
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,6144,128,0.01239999963177575
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,6144,64,0.012732444538010491
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,6144,32,0.013619555367363824
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,5120,65536,0.1581439971923828
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,5120,51200,0.12898400094774035
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,5120,16384,0.04558577802446154
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,5120,65536,0.22501866022745767
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,5120,12288,0.03649066554175483
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,5120,16384,0.06520177920659383
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,5120,10240,0.03204710947142707
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,5120,51200,0.17836533652411568
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,5120,12288,0.04990399877230326
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,5120,7168,0.02488533324665493
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,6144,5120,0.020234665936893888
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,5120,6144,0.02238044473859999
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,5120,7168,0.03286044465170966
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,5120,5120,0.019561777512232464
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,5120,6144,0.029186666011810303
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,5120,4096,0.016494222813182406
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,6144,1536,0.015827554795477126
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,5120,5120,0.02572533322705163
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,5120,3584,0.015666666958067153
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,5120,4096,0.023392889234754775
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,5120,3072,0.011696889168686338
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,5120,2560,0.010312000082598792
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,5120,3584,0.021910222040282354
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,5120,3072,0.020626667473051283
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,5120,2048,0.008995555341243744
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,5120,2560,0.018767111831241183
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,5120,1536,0.007910221815109253
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,5120,1024,0.005927111125654644
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,5120,2048,0.016976000534163583
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,5120,768,0.004895110925038655
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,5120,1536,0.01550222271018558
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,5120,1024,0.01427111029624939
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,5120,768,0.014150222142537435
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,5120,8192,0.02910400099224514
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,5120,256,0.0038693332009845306
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,5120,512,0.013411555853154926
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,5120,10240,0.04291911257637871
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,5120,128,0.003896000070704354
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,5120,8192,0.03622755408287048
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,5120,64,0.0032097777972618737
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,5120,256,0.012729778057999082
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,5120,32,0.003528000166018804
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,5120,128,0.012422222230169507
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,5120,64,0.012786666552225748
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,5120,32,0.012448888685968188
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,4096,65536,0.12190755208333333
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,4096,51200,0.09679644637637669
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,4096,12288,0.029987557066811457
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,4096,10240,0.024999999337726172
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,4096,51200,0.14762400256262884
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,4096,16384,0.05453777644369337
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,4096,8192,0.02107200026512146
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,4096,12288,0.04196000099182129
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,4096,7168,0.018575999471876357
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,4096,6144,0.016354666815863717
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,4096,10240,0.03651377889845107
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,4096,8192,0.03144711256027222
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,4096,5120,0.01424088908566369
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,4096,7168,0.029099557134840224
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,4096,4096,0.015323556131786771
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,4096,3584,0.01384800010257297
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,4096,6144,0.025383111503389146
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,4096,3072,0.012071111136012606
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,4096,5120,0.02331466641690996
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,4096,2560,0.011001778145631155
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,4096,4096,0.020822222034136455
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,4096,3584,0.01984444426165687
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,5120,512,0.004523555437723796
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,4096,2048,0.00979555563794242
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,4096,3072,0.017875555488798354
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,4096,1536,0.008302222523424361
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,4096,1024,0.006552888701359431
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,4096,2560,0.016513778103722464
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,4096,768,0.005592888842026393
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,4096,2048,0.015237333046065437
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,4096,512,0.004911111046870549
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,4096,1536,0.014608888162506951
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,4096,256,0.0038248888320393036
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,4096,128,0.003485333174467087
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,4096,768,0.013412444127930535
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,4096,512,0.013089777694808112
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,4096,64,0.003157333367400699
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,4096,256,0.012725333372751871
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,4096,32,0.003177777760558658
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,4096,128,0.012042666474978128
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,4096,16384,0.038669334517584905
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,3584,65536,0.1129395564397176
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,4096,64,0.011759999725553723
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,3584,51200,0.09138933155271743
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,4096,65536,0.1882951127158271
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,3584,16384,0.03735466798146566
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,3584,12288,0.029896888468000624
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,3584,65536,0.18450844287872314
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,3584,10240,0.02402666707833608
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,3584,51200,0.1459991137186686
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,3584,16384,0.05337244603368971
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,3584,8192,0.02015644477473365
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,3584,12288,0.04048444496260749
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,3584,7168,0.017868444323539734
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,3584,6144,0.015832000308566622
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,3584,8192,0.031327111853493586
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,3584,5120,0.014140443669425117
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,3584,7168,0.028635554843478735
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,3584,6144,0.02531911101606157
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,3584,5120,0.023014222582181294
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,3584,3584,0.010313777459992303
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,3584,4096,0.020635555187861126
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,3584,3072,0.010781333678298526
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,4096,1024,0.013461333182122974
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,3584,2560,0.008620444271299574
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,3584,3072,0.01750666730933719
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,3584,2048,0.007596444752481248
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,3584,2560,0.016516443755891588
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,3584,1536,0.006607111129495833
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,4096,32,0.012780444489585029
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,3584,2048,0.015386665860811869
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,3584,1024,0.0052737775776121355
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,3584,768,0.004648000001907349
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,3584,1536,0.014461333552996317
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,3584,512,0.0042053332759274375
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,3584,1024,0.013470222552617392
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,3584,256,0.003555555724435382
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,3584,768,0.013584888643688627
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,3584,128,0.003160888950030009
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,3584,512,0.013090666797426013
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,3584,10240,0.03527733352449205
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,3584,64,0.003154666680428717
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,3584,256,0.012358222570684222
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,3584,32,0.003168888803985384
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,3584,128,0.012090666426552666
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,3584,64,0.012061333490742577
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,3584,4096,0.01090400003724628
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,3072,65536,0.08414577775531346
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,3584,32,0.01202488856183158
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,3072,16384,0.028684443897671167
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,3072,51200,0.06806311342451307
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,3072,12288,0.023982221881548565
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,3072,10240,0.022659555077552795
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,3072,16384,0.050980445411470204
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,3072,51200,0.14261333147684732
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,3072,8192,0.01752711170249515
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,3584,3584,0.019561777512232464
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,3072,12288,0.039447112215889826
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,3072,7168,0.01720977822939555
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,3072,6144,0.014720888601409065
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,3072,5120,0.013946667313575745
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,3072,10240,0.03492088781462775
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,3072,8192,0.030518223841985066
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,3072,7168,0.02843911117977566
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,3072,6144,0.024900444679790076
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,3072,3584,0.011067555182509951
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,3072,3072,0.010026666853162978
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,3072,5120,0.022572444544898138
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,3072,2560,0.008992888861232335
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,3072,3584,0.018896889355447557
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,3072,2048,0.007927999728255803
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,3072,1536,0.006572444405820634
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,3072,2560,0.016131555040677387
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,3072,1024,0.005199111170238919
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,3072,2048,0.015188443991872998
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,3072,1536,0.014427555931939019
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,3072,768,0.00452977791428566
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,3072,512,0.0038604442444112566
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,3072,1024,0.013447110851605734
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,3072,256,0.003499555504984326
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,3072,768,0.013397333522637686
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,3072,512,0.013090666797426013
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,3072,128,0.0032017777363459268
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,3072,64,0.002975111206372579
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,3072,256,0.012113778127564324
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,3072,32,0.003145777723855443
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,3072,128,0.012089778151777057
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,3072,65536,0.17917688687642416
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,3072,64,0.011692444483439127
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,3072,32,0.011687999798191918
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,2560,65536,0.08101422256893583
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,2560,51200,0.06536622179879083
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,2560,16384,0.027181333965725366
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,2560,12288,0.02238222294383579
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,3072,4096,0.012257777982287936
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,2560,65536,0.17762311299641928
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,2560,16384,0.0503386656443278
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,2560,10240,0.019493333167499967
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,2560,51200,0.14096444182925755
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,2560,8192,0.019083556201722886
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,2560,7168,0.013441777891582914
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,3072,4096,0.01979377700222863
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,2560,6144,0.012093333734406365
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,2560,5120,0.010709332923094431
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,2560,8192,0.03016177813212077
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,3072,3072,0.017328888177871704
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,2560,7168,0.027954667806625366
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,2560,4096,0.011240888800885944
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,2560,3584,0.011071999867757162
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,2560,6144,0.024516445067193773
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,2560,3072,0.011037333144081963
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,2560,5120,0.021311110920376245
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,2560,2560,0.008314666648705801
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,2560,4096,0.019294222195943195
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,2560,2048,0.007481777833567725
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,2560,3584,0.018195556269751657
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,2560,3072,0.01687022215790219
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,2560,1536,0.006218666831652324
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,2560,1024,0.004912000149488449
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,2560,2560,0.015916445189052157
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,2560,2048,0.014892444014549255
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,2560,1536,0.014112888111008538
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,2560,1024,0.01344622257683012
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,2560,512,0.004204444587230682
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,2560,256,0.003859555555714501
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,2560,768,0.013177778157922955
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,2560,128,0.0032355555643637977
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,2560,512,0.012803555362754397
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,2560,64,0.0031795555518733132
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,2560,256,0.012328888807031842
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,2560,32,0.0031831111345026228
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,2560,128,0.011766222616036734
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,2560,64,0.011711999773979187
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,2048,65536,0.06651910808351305
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,2560,32,0.011721777419249216
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,2048,51200,0.05303466651174757
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,2048,16384,0.023702222439977858
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,2560,12288,0.03952444593111674
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,2048,65536,0.13892355230119494
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,2560,10240,0.03439822130733066
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,2048,12288,0.018702222241295707
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,2048,51200,0.11054311196009318
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,2048,10240,0.01835466590192583
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,2048,16384,0.040059556563695274
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,2048,8192,0.014615999327765571
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,2048,7168,0.015231110983424716
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,2048,6144,0.011695110963450538
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,2048,12288,0.03174044357405768
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,2048,5120,0.01236088905069563
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,2048,7168,0.0236453331179089
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,2048,4096,0.009016888837019602
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,2048,6144,0.020582222276263766
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,2560,768,0.004543111142185
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,2048,3584,0.008953777452309927
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,2048,5120,0.018214222457673814
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,2048,3072,0.007638221813572778
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,2048,2560,0.00664444433318244
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,2048,4096,0.01683111157682207
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,2048,3584,0.01614755557643043
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,2048,2048,0.006934222247865465
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,2048,3072,0.015097777048746744
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,2048,1536,0.0052168890833854675
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,2048,2560,0.01443733274936676
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,2048,1024,0.004537777768241035
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,2048,768,0.004238222208287981
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,2048,2048,0.013747555514176687
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,2048,1536,0.013409777647919126
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,2048,512,0.0035946667194366455
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,2048,1024,0.012768000364303589
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,2048,768,0.01274222218328052
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,2048,128,0.0031617778456873367
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,2048,512,0.01242844429281023
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,2048,64,0.0028355556229750314
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,2048,256,0.011878222227096558
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,2048,32,0.003176888864901331
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,2048,128,0.01184622198343277
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,1536,65536,0.04856355653868782
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,2048,64,0.011709333293967776
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,2048,32,0.011422221859296164
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,1536,51200,0.04007200068897671
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,1536,16384,0.01787911189926995
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,1536,12288,0.017159110969967313
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,2048,10240,0.02852355440457662
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,1536,65536,0.13537689050038657
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,1536,51200,0.10764533281326294
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,2048,8192,0.025403555896547105
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,1536,16384,0.03859466645452712
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,1536,10240,0.015118221441904703
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,1536,8192,0.01408088869518704
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,1536,7168,0.012545777691735161
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,1536,12288,0.03083733386463589
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,1536,6144,0.011119999819331698
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,1536,5120,0.010037333601050908
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,1536,10240,0.028156446086035833
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,1536,4096,0.008739555875460306
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,1536,7168,0.023269333773189124
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,1536,8192,0.02437866727511088
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,1536,3584,0.00793511089351442
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,1536,6144,0.01995022263791826
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,1536,5120,0.01789777808719211
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,1536,3072,0.007290666302045186
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,1536,2560,0.007275555696752336
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,1536,2048,0.006241777704821692
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,1536,4096,0.016884444488419425
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,1536,1536,0.006061333335108227
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,1536,3584,0.016161777906947665
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,1536,3072,0.014841778410805596
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,1536,1024,0.004581333448489507
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,1536,768,0.0041804446114434134
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,1536,2560,0.01425244410832723
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,1536,512,0.0038319999972979226
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,1536,2048,0.013766222529941134
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,1536,1536,0.013440888788965015
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,1536,256,0.003504000190231535
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,1536,1024,0.01273155543539259
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,1536,128,0.0029475556479560006
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,1536,768,0.012503999802801343
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,2048,256,0.0034871109657817413
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,1536,64,0.002899555489420891
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,1536,512,0.012096000214417776
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,1536,32,0.0028488888508743713
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,1536,256,0.011715555356608497
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,1536,128,0.011730666789743634
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,1024,65536,0.03637866510285272
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,1536,64,0.011709333293967776
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,1536,32,0.011780444118711682
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,1024,12288,0.013208000196350945
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,1024,65536,0.13201155927446154
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,1024,16384,0.03811288873354594
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,1024,51200,0.10494044754240249
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,1024,10240,0.014196443888876172
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,1024,8192,0.012108444339699216
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,1024,12288,0.030988444884618122
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,1024,7168,0.011530666715568967
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,1024,6144,0.010491555763615502
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,1024,10240,0.02739288906256358
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,1024,8192,0.023436443673239812
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,1024,5120,0.011152000062995486
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,1024,7168,0.021754667162895203
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,1024,4096,0.008605333666006723
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,1024,3584,0.00794311116139094
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,1024,6144,0.019561777512232464
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,1024,3072,0.007610666255156199
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,1024,5120,0.017647110753589206
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,1024,2560,0.006598222172922558
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,1024,4096,0.016555555992656283
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,1024,3584,0.01591999994383918
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,1024,3072,0.01480977733929952
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,1024,1536,0.0052471111218134565
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,1024,2560,0.014141332772043018
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,1024,1024,0.004224888980388641
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,1024,2048,0.013769778112570444
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,1024,768,0.003871110992299186
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,1024,1536,0.013421333498424955
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,1024,512,0.003549333247873518
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,1024,1024,0.012726222475369772
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,1024,256,0.0032008888406885993
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,1024,768,0.012452444268597497
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,1024,128,0.0028799999919202593
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,1024,51200,0.029808001385794744
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,1024,16384,0.015229332778188916
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,1024,512,0.01240888900227017
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,1024,64,0.0028364445186323593
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,1024,32,0.0028719999310043124
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,1024,256,0.011764444410800934
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,1024,128,0.011698666546079846
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,768,65536,0.028991109795040552
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,1024,64,0.011350221931934357
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,1024,32,0.011405333048767514
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,768,16384,0.017051556044154696
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,768,12288,0.01477688882086012
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,768,65536,0.13051644961039224
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,768,51200,0.10378844208187527
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,768,10240,0.01372977760103014
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,768,16384,0.0377146667904324
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,768,8192,0.012101333174440594
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,768,12288,0.030061334371566772
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,768,7168,0.010848888920413123
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,768,10240,0.026389333936903212
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,768,6144,0.010047111246320937
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,768,8192,0.023041778140597876
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,768,5120,0.008671999805503422
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,768,4096,0.007985778152942657
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,1024,2048,0.005902222047249476
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,768,3584,0.007299555672539606
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,768,6144,0.019554666346973844
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,768,3072,0.006631111105283101
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,768,5120,0.017861333158281114
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,768,2560,0.005930666708283954
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,768,4096,0.01648266613483429
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,768,2048,0.005251555393139522
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,768,3584,0.016202666693263583
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,768,1536,0.004899555610285865
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,768,3072,0.01479822231663598
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,768,1024,0.004232888834344016
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,768,2560,0.014318222800890604
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,768,768,0.0038728887836138406
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,768,2048,0.013404444687896304
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,768,512,0.003536888708670934
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,768,1536,0.013439999686347114
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,768,256,0.003489777859714296
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,768,1024,0.01274222218328052
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,768,768,0.012455999851226807
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,768,512,0.012109333442317115
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,768,64,0.003014222201373842
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,768,256,0.012105777859687805
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,768,32,0.0028124445428450904
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,768,128,0.011722666521867117
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,512,65536,0.02566577825281355
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,768,64,0.011368888947698804
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,768,51200,0.024355555574099224
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,512,16384,0.011686222420798408
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,512,65536,0.12930222352345785
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,512,12288,0.010066666536860997
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,512,51200,0.1019173330730862
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,512,16384,0.037088887559043035
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,512,10240,0.012423111332787408
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,512,12288,0.029551111989551123
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,768,7168,0.021613332960340712
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,512,8192,0.011104889214038849
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,512,10240,0.02607733342382643
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,512,7168,0.010392000277837118
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,512,6144,0.009639110830095079
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,512,8192,0.022629333866967097
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,512,7168,0.021631111701329548
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,512,5120,0.008949333594905006
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,512,6144,0.019440000255902607
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,512,4096,0.007932444413503012
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,512,3584,0.007247111035717859
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,512,5120,0.017878222796652053
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,512,3072,0.006330666856633292
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,512,4096,0.01646399994691213
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,512,3584,0.015802666544914246
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,512,2560,0.005920889063013925
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,512,2048,0.005886222339338726
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,512,1536,0.004902222090297275
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,512,3072,0.014782221780882942
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,512,2560,0.01422044469250573
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,512,1024,0.0041804446114434134
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,512,2048,0.013412444127930535
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,512,768,0.0038364442686239877
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,768,32,0.011754666765530905
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,512,512,0.0032924444725116095
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,512,1536,0.013055110971132914
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,512,256,0.003156444471743372
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,512,128,0.003154666680428717
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,512,1024,0.012402666939629449
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,512,768,0.01239822225438224
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,512,64,0.0028737777223189673
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,512,512,0.012437333663304647
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,512,256,0.011692444483439127
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,256,65536,0.02127200033929613
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,512,128,0.011728000309732227
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,512,64,0.011354666617181567
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,256,51200,0.019327110714382596
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,512,32,0.011728000309732227
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,256,16384,0.010030222435792288
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,256,12288,0.009009777671760982
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,256,65536,0.1275600062476264
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,256,16384,0.035304887427224055
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,256,10240,0.009307555854320526
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,256,12288,0.02887822190920512
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,256,8192,0.008624888956546783
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,256,7168,0.009360888765917884
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,256,10240,0.02607022225856781
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,256,8192,0.022887110710144043
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,256,6144,0.009742221898502773
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,256,7168,0.021271111236678228
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,256,5120,0.00869422240389718
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,768,128,0.0028737777223189673
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,256,4096,0.007635555333561367
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,256,3584,0.006963555183675554
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,256,6144,0.019271110494931538
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,256,5120,0.01755822201569875
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,256,3072,0.006292444550328785
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,256,4096,0.016377778516875375
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,256,2560,0.005718222094906702
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,256,3584,0.015860444969601102
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,256,2048,0.005048888838953442
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,512,51200,0.02055999967787001
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,256,1536,0.004528000122971005
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,256,3072,0.014436443646748861
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,256,1024,0.0041991112132867174
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,256,2560,0.014073777529928418
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,256,768,0.003855111284388436
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,256,2048,0.013772444592581855
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,256,512,0.0031582222630580268
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,256,1536,0.013088000317414602
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,256,256,0.002887111157178879
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,256,1024,0.012317332956526013
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,256,128,0.0028275555620590844
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,256,768,0.012387555506494312
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,256,64,0.0028115556471877625
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,256,32,0.0028151110228565005
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,256,512,0.012420444852775998
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,256,256,0.011422221859296164
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,256,128,0.011358222199810876
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,256,64,0.011352889239788055
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,128,51200,0.014669333895047506
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,256,32,0.011408888631396823
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,128,16384,0.009644444617960189
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,128,12288,0.009716444545321995
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,256,51200,0.10025244288974339
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,128,65536,0.12615644931793213
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,128,10240,0.009103111094898647
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,128,51200,0.09954577684402466
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,128,16384,0.03571466604868571
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,128,8192,0.00831911133395301
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,128,12288,0.028720001379648846
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,128,7168,0.009293333523803288
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,128,6144,0.008584889272848764
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,128,10240,0.026030222574869793
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,128,8192,0.022310222188631695
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,128,7168,0.021270222134060327
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,128,4096,0.007307555940416124
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,128,6144,0.0192266669538286
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,128,3584,0.006879999819729064
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,128,5120,0.01756444407833947
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,128,3072,0.006256888724035687
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,128,3584,0.015632889337009855
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,128,2560,0.005669333454635408
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,128,3072,0.014480888843536377
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,128,2048,0.005234666582610872
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,512,32,0.00282577777074443
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,128,2560,0.014195554786258273
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,128,1536,0.004517333375083076
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,128,1024,0.0038488888078265717
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,128,2048,0.013335111240545908
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,128,768,0.003510222252872255
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,128,65536,0.016844444804721408
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,128,1536,0.013060444758998023
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,128,512,0.0032088889016045462
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,128,1024,0.01220533334546619
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,128,256,0.0028533333291610083
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,128,128,0.0028497777465316984
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,128,512,0.012061333490742577
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,128,64,0.0028168888141711554
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,128,256,0.011522666447692446
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,128,32,0.002536888958679305
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,128,64,0.011528888510333167
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,128,5120,0.008625778059164682
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,128,4096,0.015882665912310284
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,64,65536,0.1252924468782213
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,64,51200,0.019567999574873183
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,64,16384,0.009342222577995723
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,64,51200,0.098907556798723
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,64,16384,0.03460888730155097
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,64,12288,0.009638222555319468
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,64,10240,0.008711111214425828
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,64,12288,0.028456889920764502
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,64,10240,0.025536888175540503
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,64,8192,0.008271111382378472
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,64,7168,0.009000889129108852
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,64,8192,0.022325333621766832
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,128,128,0.011686222420798408
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,64,7168,0.020946666598320007
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,64,5120,0.007598222129874759
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,128,32,0.011032000184059143
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,64,6144,0.01924977699915568
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,64,4096,0.0069360000391801195
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,64,5120,0.01740444368786282
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,64,3584,0.0069191112286514705
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,64,3072,0.0062871111763848206
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,64,2560,0.005680000202523337
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,64,4096,0.01644444465637207
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,64,3584,0.015294222368134392
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,64,2048,0.004911111046870549
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,64,3072,0.014461333552996317
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,64,1536,0.0042462220622433555
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,64,1024,0.00387999994887246
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,64,2048,0.013050666285885705
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,64,1536,0.012784000072214337
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,64,768,0.003546666767862108
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,64,512,0.00318755561278926
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,64,1024,0.012776888906955719
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,64,256,0.0028417776856157514
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,64,768,0.012216000093354119
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,64,512,0.011748444702890186
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,64,256,0.011971555650234222
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,64,64,0.0028444443725877335
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,64,128,0.01107377807299296
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,128,768,0.012284444438086616
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,64,32,0.002806222273243798
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,32,65536,0.024320888850424025
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,64,32,0.011036444041464063
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,32,51200,0.020280000236299302
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,64,65536,0.024334222078323364
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,32,16384,0.012772444221708508
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,32,51200,0.09862133529451157
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,32,12288,0.009318222602208456
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,32,16384,0.03503111004829407
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,32,10240,0.008660444782839881
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,64,2560,0.014352000421947904
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,32,8192,0.008114666574531132
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,32,10240,0.02574311031235589
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,32,7168,0.008965333302815756
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,32,8192,0.022674666510687932
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,32,6144,0.008415111237102086
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,64,128,0.0028204443968004654
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,32,5120,0.00794400026400884
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,32,7168,0.021295999487241108
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,32,4096,0.006968888971540663
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,32,6144,0.019277332557572257
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,32,3584,0.0069351109365622205
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,32,5120,0.017507554756270517
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,64,64,0.011434666812419891
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,32,3072,0.006220444622966979
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,32,4096,0.016194666425387066
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,32,2560,0.005542222410440445
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,64,6144,0.008256889051861232
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,32,3584,0.01581333412064446
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,32,2048,0.004986666556861666
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,32,1536,0.004530666602982415
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,32,1024,0.0038622220357259116
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,32,3072,0.014826666977670459
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,32,2560,0.014110222458839417
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,32,65536,0.12463288837009007
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,32,768,0.003510222252872255
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,32,2048,0.013125333521101209
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,32,1536,0.012895111408498553
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,32,512,0.0031973332580592898
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,32,256,0.0028657778683635923
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,32,128,0.0028408887899584244
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,32,1024,0.012758221891191272
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,32,64,0.002559111143151919
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,32,768,0.012077333198653327
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,32,512,0.011710222396585675
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,193,32,32,0.0025155554629034465
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,32,128,0.01108266661564509
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,32,64,0.011607111328177981
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,32,32,0.010713777608341642
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,65536,16384,0.3938071197933621
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,65536,16384,0.30230310228135854
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,65536,12288,0.2996879948510064
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,65536,51200,0.9223946465386285
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,32,256,0.011760888828171624
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,65536,51200,1.2340728971693251
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,65536,12288,0.22406310505337187
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,193,32,12288,0.02878311276435852
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,65536,10240,0.2372666729821099
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,65536,8192,0.1963111162185669
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,65536,10240,0.19044978088802764
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,65536,8192,0.15576533476511636
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,65536,7168,0.17061955398983428
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,65536,7168,0.13540355364481607
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,65536,6144,0.14618399408128527
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,65536,12288,0.24831644694010416
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,65536,10240,0.2080533372031318
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,65536,16384,0.32777778307596844
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,65536,6144,0.11656978395250107
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,65536,8192,0.17174133989546034
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,65536,5120,0.10859111282560562
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,65536,4096,0.10342311196857029
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,65536,7168,0.1513004435433282
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,65536,3584,0.09197688764995998
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,65536,4096,0.0867982241842482
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,65536,3584,0.07390489180882771
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,65536,5120,0.11629777484469944
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,65536,3072,0.08019289043214586
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,65536,6144,0.13334043820699057
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,65536,4096,0.0988488859600491
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,65536,2560,0.06411911381615533
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,65536,3072,0.06519822279612224
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,65536,3584,0.09027110868030125
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,65536,2048,0.053152001566357084
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,65536,2560,0.05787822273042467
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,65536,3072,0.08220444122950236
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,65536,1536,0.041053334871927895
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,65536,5120,0.12751466698116726
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,65536,2048,0.05048355460166931
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,65536,2560,0.07487110959159003
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,65536,1024,0.0306951105594635
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,65536,2048,0.0655991103914049
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,65536,768,0.02386133372783661
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,65536,1536,0.05647822221120199
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,65536,1024,0.034309334225124784
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,65536,1024,0.04941066768434313
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,65536,768,0.029167999823888142
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,65536,768,0.04423822296990288
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,65536,256,0.012069332930776807
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,65536,512,0.02475555572244856
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,65536,512,0.03971555497911241
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,65536,128,0.010392888552612728
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,65536,256,0.022575111852751836
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,65536,64,0.008994667066468133
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,65536,256,0.03568533394071791
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,65536,32,0.010749333434634738
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,65536,128,0.021614222062958613
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,65536,128,0.030072000291612413
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,65536,64,0.020963556236690942
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,65536,32,0.028354667954974707
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,65536,1536,0.04155022237035964
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,65536,512,0.017200888858901132
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,51200,51200,0.7406284544203016
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,51200,65536,0.9377430809868706
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,51200,65536,1.0922213660346138
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,51200,51200,0.8488942252265083
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,51200,16384,0.2767519950866699
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,51200,12288,0.21688621573977998
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,51200,16384,0.24200532171461317
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,51200,12288,0.18250755469004312
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,65536,51200,1.0169777340359158
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,51200,10240,0.15330755710601807
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,51200,10240,0.18809866905212402
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,51200,8192,0.1661306619644165
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,51200,7168,0.13706933127509222
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,51200,12288,0.20864889356825086
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,51200,7168,0.1129582193162706
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,51200,10240,0.17712710963355172
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,51200,8192,0.1484337780210707
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,51200,6144,0.11537955866919623
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,51200,6144,0.09616266356574164
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,51200,5120,0.09825066725413005
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,51200,5120,0.08182044161690606
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,51200,8192,0.12811199824015299
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,51200,7168,0.13265244166056314
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,51200,6144,0.11704977353413899
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,51200,4096,0.08169155650668673
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,51200,4096,0.06868710782792833
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,51200,3584,0.07163021961847942
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,51200,5120,0.10279555453194512
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,51200,3072,0.06446399953630236
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,51200,3584,0.06185511085722181
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,51200,4096,0.0879253347714742
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,51200,3072,0.05524444580078125
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,51200,2560,0.05584177705976698
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,51200,3584,0.08076355854670207
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,51200,2560,0.04870133267508613
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,51200,16384,0.27359289593166775
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,51200,2048,0.044165333112080894
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,51200,3072,0.07329777876536052
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,51200,1536,0.0344524449772305
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,51200,2048,0.04247911108864678
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,51200,2560,0.06659911076227824
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,51200,1024,0.026887999640570745
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,51200,1536,0.03593422306908502
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,51200,1536,0.05236000153753492
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,51200,768,0.02039377722475264
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,51200,1024,0.02942044536272685
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,51200,1024,0.045736889044443764
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,51200,512,0.014997333288192749
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,51200,768,0.025760889053344727
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,51200,768,0.04125244418780009
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,51200,512,0.03845599955982632
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,51200,256,0.011351111034552256
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,51200,256,0.020230222079488967
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,51200,128,0.00888177752494812
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,51200,256,0.03385600116517808
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,51200,64,0.007298666569921706
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,51200,128,0.028134223487642076
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,51200,128,0.01891288823551602
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,51200,32,0.007617777420414819
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,51200,64,0.019274666905403137
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,51200,32,0.022301332818137273
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,16384,65536,0.3829030990600586
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,51200,51200,0.8359813160366483
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,16384,65536,0.3836071226331923
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,16384,51200,0.29956176545884877
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,51200,512,0.021828444467650518
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,16384,51200,0.31570132573445636
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,16384,16384,0.09894933303197224
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,16384,12288,0.07645777861277263
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,16384,16384,0.10405244429906209
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,51200,65536,1.104434649149577
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,16384,12288,0.07959733406702678
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,16384,10240,0.06773955292171903
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,16384,16384,0.12439021799299453
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,16384,12288,0.09825422366460164
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,16384,10240,0.06800266769197252
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,16384,8192,0.05482666691144308
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,51200,2048,0.059340443876054555
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,16384,7168,0.046880000167422824
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,16384,8192,0.0595831142531501
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,16384,6144,0.040700445572535195
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,16384,7168,0.05272000034650167
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,16384,10240,0.09532533089319865
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,16384,8192,0.0751004417737325
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,16384,5120,0.036355555057525635
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,16384,6144,0.044663998815748424
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,16384,4096,0.02948444419436985
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,16384,51200,0.3419582313961453
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,16384,6144,0.061971558464898
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,16384,7168,0.0698524448606703
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,16384,5120,0.03900977638032701
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,16384,65536,0.4350506729549832
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,16384,5120,0.057032002343071826
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,16384,4096,0.034190220965279475
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,16384,3072,0.02335111134582096
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,16384,3584,0.03127022253142463
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,16384,2560,0.019546666079097323
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,16384,4096,0.04983555608325534
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,16384,3072,0.028135110934575398
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,16384,3072,0.04397955536842346
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,16384,2048,0.016184000505341422
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,16384,2560,0.024892444411913555
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,16384,2560,0.040955556763543025
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,16384,2048,0.022819555468029443
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,16384,2048,0.03780000077353583
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,16384,1024,0.01038577738735411
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,16384,1536,0.020259555843141343
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,16384,1536,0.03460977805985345
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,16384,768,0.008879111044936711
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,16384,1024,0.03199999862247043
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,16384,1024,0.01813155578242408
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,16384,512,0.007263999846246507
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,16384,768,0.016530666086408827
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,16384,256,0.004946666873163647
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,16384,512,0.014908444550302295
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,16384,512,0.027067555321587458
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,16384,128,0.004506666627195147
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,16384,256,0.014110222458839417
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,16384,256,0.02439022229777442
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,16384,64,0.004809777769777509
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,16384,32,0.004584889031118817
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,16384,128,0.02160800000031789
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,16384,128,0.013976888524161445
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,16384,64,0.013520888984203339
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,16384,3584,0.026263111167483862
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,16384,32,0.01387466655837165
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,16384,3584,0.04731111062897576
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,12288,65536,0.27826934390597874
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,16384,1536,0.013091555900043912
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,12288,51200,0.21511733531951904
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,12288,65536,0.29926400714450413
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,12288,16384,0.07502755853864881
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,12288,12288,0.05751466751098633
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,12288,51200,0.23766843477884927
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,12288,16384,0.08080266581641303
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,16384,768,0.029098666376537744
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,12288,10240,0.047636446025636464
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,12288,12288,0.06404355499479505
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,12288,16384,0.12177688545650905
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,12288,10240,0.05481688843833076
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,12288,8192,0.04119377666049533
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,12288,7168,0.03606755534807841
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,12288,12288,0.09705866707695855
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,12288,8192,0.04828177889188131
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,12288,10240,0.08570133315192328
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,12288,7168,0.04352444410324097
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,12288,8192,0.07420355743832059
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,12288,6144,0.03054222133424547
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,12288,5120,0.026700443691677515
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,12288,7168,0.06863022512859769
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,12288,6144,0.03661422265900506
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,12288,6144,0.061266667313045926
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,12288,4096,0.0229404436217414
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,12288,5120,0.031890667147106595
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,12288,5120,0.055255999167760216
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,12288,4096,0.028598222467634413
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,12288,3584,0.01977066695690155
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,12288,3072,0.017879999346203275
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,12288,4096,0.049152887529797025
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,12288,2560,0.014782221780882942
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,12288,3584,0.025379555092917547
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,12288,3584,0.04626489016744825
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,12288,51200,0.3327004379696316
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,12288,65536,0.4231706725226508
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,12288,3072,0.04282133446799385
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,12288,1536,0.01072622256146537
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,12288,2560,0.04026133484310574
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,12288,2560,0.022035555707083807
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,12288,1024,0.008983111215962304
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,12288,2048,0.03728355632887946
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,12288,1536,0.018209778600268893
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,12288,1536,0.03331644336382548
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,12288,768,0.007598222129874759
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,12288,1024,0.016211556063758004
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,12288,1024,0.031108445591396753
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,12288,512,0.005904888941182031
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,12288,768,0.029751999510659113
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,12288,768,0.014891554911931356
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,12288,256,0.004545777622196409
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,12288,512,0.014121777481502958
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,12288,512,0.02637600070900387
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,12288,128,0.003887999802827835
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,12288,256,0.013358222113715278
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,12288,64,0.003843555433882607
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,12288,128,0.021783999270863
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,12288,128,0.013076444466908773
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,12288,32,0.0038693332009845306
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,12288,64,0.013065777719020844
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,12288,32,0.013936888840463428
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,10240,65536,0.266757329305013
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,12288,3072,0.023407111565272015
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,12288,2048,0.012878222597969903
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,10240,65536,0.28261510531107586
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,10240,51200,0.2057715521918403
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,12288,2048,0.02017688916789161
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,10240,16384,0.06942222515741985
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,10240,12288,0.054409778780407377
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,10240,51200,0.22346843613518608
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,10240,16384,0.07982044749789767
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,10240,12288,0.061695112122429736
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,10240,10240,0.04688622223006355
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,12288,256,0.024325332707828943
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,10240,16384,0.12187822659810384
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,10240,12288,0.09683644771575928
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,10240,8192,0.03862133291032579
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,10240,10240,0.053188443183898926
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,10240,7168,0.03356355428695679
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,10240,10240,0.08503378099865383
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,10240,8192,0.0471111105548011
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,10240,6144,0.02986577815479702
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,10240,8192,0.07380800114737616
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,10240,7168,0.04171644316779243
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,10240,7168,0.06838311089409722
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,10240,5120,0.025871111287011042
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,10240,6144,0.060589333375295006
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,10240,4096,0.021511110994550917
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,10240,65536,0.42037778430514866
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,10240,5120,0.03088266650835673
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,10240,5120,0.05439466569158766
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,10240,3584,0.01926666663752662
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,10240,4096,0.027132444911532935
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,10240,4096,0.04843733376926846
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,10240,3072,0.017190222938855488
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,10240,3584,0.024678222007221643
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,10240,3584,0.045143110884560474
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,10240,2560,0.014582221706708273
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,10240,3072,0.04212444358401828
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,10240,3072,0.023215111758973863
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,10240,2048,0.01276533305644989
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,10240,2560,0.039734221167034574
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,10240,2560,0.021495999561415777
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,10240,1536,0.010649777948856354
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,10240,2048,0.03684533304638333
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,10240,2048,0.019540444016456604
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,10240,1024,0.008968888885445064
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,10240,1536,0.017856889300876193
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,10240,768,0.007098666495747036
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,10240,1024,0.02955555584695604
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,10240,1024,0.015562666787041558
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,10240,512,0.005884444548024072
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,10240,768,0.014515555567211576
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,10240,256,0.004683555414279302
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,10240,768,0.027790221903059218
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,10240,512,0.026570666167471144
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,10240,512,0.014031110538376702
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,10240,128,0.0041697778635554844
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,10240,6144,0.03504533237881131
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,10240,256,0.024668445189793903
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,10240,64,0.0038577777643998465
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,10240,51200,0.3308088779449463
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,10240,32,0.0038417776425679526
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,10240,128,0.02125599980354309
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,10240,64,0.012431110772821637
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,10240,32,0.01273155543539259
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,8192,65536,0.19526133272382948
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,8192,51200,0.15338844723171657
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,8192,65536,0.23936711417304146
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,8192,16384,0.053448888990614146
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,10240,1536,0.03252355588807
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,8192,51200,0.19003821743859184
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,8192,16384,0.06892177793714735
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,8192,12288,0.04148533278041416
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,8192,12288,0.05401866634686788
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,8192,10240,0.034154666794670954
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,8192,16384,0.08962133195665146
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,8192,12288,0.0722000002861023
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,8192,8192,0.029205332199732464
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,8192,10240,0.04698488778538174
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,10240,128,0.01311288856797748
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,8192,65536,0.28353243403964573
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,8192,10240,0.06453422043058607
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,8192,51200,0.22597156630622017
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,8192,8192,0.0406675570540958
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,8192,6144,0.022425777382320825
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,8192,8192,0.05667822228537666
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,8192,7168,0.03554844525125291
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,8192,6144,0.03058755397796631
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,8192,6144,0.04703199863433838
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,8192,4096,0.016344888342751395
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,8192,5120,0.027240888939963445
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,8192,5120,0.04354666670163473
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,8192,3584,0.01443555619981554
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,8192,4096,0.02404977712366316
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,8192,4096,0.03934489025010003
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,8192,3072,0.012706666356987424
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,8192,3584,0.022452443838119507
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,8192,3584,0.03728177812364366
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,8192,2560,0.011328000161382886
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,8192,3072,0.021065778202480737
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,8192,3072,0.035818666219711304
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,8192,2048,0.009763555394278632
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,8192,2560,0.019546666079097323
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,8192,2560,0.03405333227581448
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,8192,1536,0.008722667064931657
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,8192,2048,0.01837688850031959
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,8192,2048,0.03245688809288873
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,8192,1024,0.006619555668698416
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,8192,1536,0.016210666961140104
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,8192,1536,0.0277502222193612
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,8192,7168,0.025448888540267944
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,8192,1024,0.014482667048772177
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,8192,1024,0.026710222164789837
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,8192,512,0.0045422220395671
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,8192,5120,0.01924800044960446
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,8192,768,0.024699555502997503
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,8192,256,0.003879111260175705
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,8192,512,0.013414222333166333
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,8192,512,0.024653333756658766
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,8192,128,0.003549333247873518
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,8192,256,0.01274311128589842
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,8192,256,0.02300888962215847
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,8192,64,0.0038337777886125776
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,8192,128,0.012442666623327466
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,8192,128,0.019595555133289762
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,8192,32,0.0038248888320393036
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,8192,64,0.012049777640236748
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,8192,32,0.012442666623327466
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,7168,65536,0.18443732791476777
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,10240,256,0.013072888884279462
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,7168,51200,0.13855377833048502
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,7168,65536,0.23454843627081978
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,8192,768,0.005593777944644292
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,7168,16384,0.048897776338789195
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,7168,51200,0.18581422170003256
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,8192,7168,0.052876445982191295
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,7168,12288,0.03763466742303636
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,7168,16384,0.06782399945788913
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,7168,16384,0.08813244766659206
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,7168,12288,0.05273155702484978
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,7168,10240,0.03194222185346816
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,7168,65536,0.27792978286743164
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,7168,8192,0.027375110321574744
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,7168,51200,0.22291199366251627
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,7168,10240,0.04609866605864631
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,7168,7168,0.024030221833123103
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,7168,10240,0.0638293359014723
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,7168,8192,0.0388408899307251
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,7168,6144,0.021021333005693223
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,7168,8192,0.05609955390294393
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,7168,7168,0.03467466764979892
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,7168,5120,0.01798488861984677
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,7168,7168,0.051911999781926475
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,7168,6144,0.030004445049497817
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,7168,6144,0.04648355642954508
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,7168,5120,0.02619733413060506
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,7168,5120,0.043318221966425575
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,7168,3584,0.013550221920013428
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,7168,4096,0.02370044423474206
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,7168,3072,0.012421333127551608
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,7168,3584,0.03724088933732774
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,7168,3584,0.022242666946517095
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,7168,2560,0.01089511149459415
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,8192,768,0.013839110732078552
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,7168,3072,0.020608888732062448
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,7168,3072,0.035226666265063815
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,7168,2560,0.019342222147517733
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,7168,2560,0.03376355436113145
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,7168,1536,0.007987555530336168
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,7168,2048,0.017542221479945712
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,7168,2048,0.031544887357287936
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,7168,1024,0.00629333323902554
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,7168,1536,0.016378665963808697
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,7168,1536,0.02734577821360694
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,7168,12288,0.07158133056428698
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,7168,768,0.005570666657553778
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,7168,1024,0.027160889572567407
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,7168,1024,0.014449778530332776
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,7168,768,0.013792888985739814
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,7168,512,0.013122667041089801
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,7168,512,0.024679111109839544
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,7168,256,0.003842666745185852
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,7168,4096,0.01532799998919169
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,7168,128,0.0038951109680864546
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,7168,256,0.012732444538010491
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,7168,256,0.024005333582560223
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,7168,4096,0.039035555389192365
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,7168,64,0.0032222221295038858
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,7168,32,0.0035182221068276297
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,7168,128,0.012404444317022959
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,7168,128,0.020229332976871066
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,7168,64,0.01277955538696713
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,7168,32,0.013762666947311826
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,7168,2048,0.009563555320103964
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,6144,65536,0.18207911650339761
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,6144,65536,0.19630132781134713
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,6144,51200,0.1316666603088379
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,6144,16384,0.04814666509628296
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,6144,51200,0.155967116355896
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,6144,12288,0.03675644596417745
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,6144,16384,0.057951112588246666
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,7168,512,0.004492444296677907
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,6144,16384,0.08372977707121108
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,6144,12288,0.04531466629770067
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,6144,10240,0.03141511148876614
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,6144,12288,0.06875110997094049
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,6144,8192,0.026175111532211304
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,6144,10240,0.03913244605064392
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,6144,51200,0.21204622586568198
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,6144,10240,0.061047997739579946
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,6144,65536,0.26532000965542263
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,6144,8192,0.03349599904484219
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,6144,7168,0.02268444498380025
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,6144,8192,0.053977777560551964
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,6144,6144,0.019547555181715224
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,6144,5120,0.017471111483044095
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,6144,7168,0.050548444191614784
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,6144,7168,0.029623998536003962
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,6144,6144,0.045257776975631714
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,6144,6144,0.025942222939597234
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,6144,5120,0.023741333021057978
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,6144,3584,0.012396444049146442
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,6144,5120,0.0424924459722307
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,6144,4096,0.02137511140770382
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,6144,3072,0.01201333353916804
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,6144,3584,0.020267556111017864
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,6144,3584,0.036496000157462224
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,6144,2560,0.01035199976629681
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,6144,3072,0.018930666976504855
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,6144,2048,0.009315555294354757
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,6144,2560,0.033407111962636314
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,6144,2560,0.017687110437287223
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,6144,2048,0.015802666544914246
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,6144,1536,0.007932444413503012
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,6144,2048,0.03152622116936578
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,7168,768,0.024785778588718835
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,6144,1024,0.006625777731339137
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,6144,1536,0.028463999430338543
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,6144,1024,0.013620444469981723
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,6144,1024,0.025791999366548326
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,6144,768,0.005271111097600725
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,6144,512,0.004519111166397731
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,6144,768,0.02496799992190467
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,6144,4096,0.015103111664454142
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,6144,256,0.0035502223504914176
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,6144,512,0.024043555061022442
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,6144,512,0.01279022213485506
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,6144,128,0.0034977777136696708
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,6144,4096,0.03828444414668613
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,6144,256,0.012432888978057437
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,6144,256,0.022301332818137273
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,6144,64,0.0031635556370019913
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,6144,32,0.0032133333798911837
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,6144,3072,0.03467288944456313
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,6144,128,0.019880000087949965
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,6144,128,0.012040889097584618
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,6144,64,0.01204355557759603
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,6144,32,0.012057777908113269
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,5120,65536,0.14503644572363958
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,5120,51200,0.11789955033196343
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,5120,65536,0.19141066074371338
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,5120,16384,0.04672355453173319
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,5120,51200,0.15358044041527644
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,6144,1536,0.014775110615624322
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,5120,12288,0.036483556032180786
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,5120,16384,0.05641600158479479
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,5120,10240,0.030290666553709242
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,5120,16384,0.0831893351342943
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,5120,12288,0.0435751113626692
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,5120,12288,0.06791910860273573
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,5120,8192,0.02603200078010559
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,6144,768,0.01347733371787601
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,5120,65536,0.2627066771189372
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,5120,10240,0.03680177860789829
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,5120,10240,0.06049599912431505
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,5120,51200,0.20891200171576607
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,5120,8192,0.03229511115286086
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,5120,6144,0.020177778270509508
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,5120,8192,0.05326666765742832
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,5120,5120,0.01702577703528934
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,5120,7168,0.02922755479812622
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,5120,7168,0.049963557057910495
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,5120,4096,0.014363555444611443
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,5120,6144,0.044284443060557045
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,5120,6144,0.02570666703912947
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,5120,5120,0.023416888382699754
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,5120,5120,0.04145777887768216
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,5120,3072,0.011628444823953839
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,5120,4096,0.036997334824668035
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,5120,4096,0.021164443757798936
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,5120,3584,0.03606311149067349
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,5120,3584,0.0199297782447603
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,5120,2560,0.010036444498433007
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,5120,2048,0.008971555365456475
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,5120,3072,0.018799111247062683
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,5120,2560,0.032249778509140015
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,5120,2560,0.017460443907313876
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,5120,1536,0.007600000335110559
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,5120,2048,0.01551822159025404
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,5120,2048,0.028993778758578833
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,5120,1024,0.005535111245181825
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,5120,1536,0.01443288889196184
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,5120,768,0.004860444615284602
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,5120,1024,0.02569244470861223
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,5120,768,0.01314133322901196
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,5120,512,0.004182222402758068
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,5120,7168,0.02267733381854163
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,5120,512,0.012727999852763282
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,5120,256,0.0035582222044467926
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,5120,512,0.025389333566029865
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,5120,3584,0.013028444515334235
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,5120,256,0.012413333687517377
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,5120,256,0.023676445086797077
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,5120,128,0.003532444437344869
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,5120,64,0.0032026666320032547
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,5120,128,0.012057777908113269
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,5120,128,0.020263999700546265
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,5120,32,0.0031644445326593188
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,5120,3072,0.03419911199145847
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,5120,64,0.012089778151777057
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,4096,65536,0.11452889442443848
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,5120,32,0.012520888613329994
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,4096,51200,0.09039822551939224
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,5120,1536,0.028132445282406274
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,4096,65536,0.18639822800954184
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,4096,16384,0.03463733196258545
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,4096,51200,0.14713066154056126
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,5120,768,0.02502577834659153
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,4096,12288,0.029919111066394385
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,4096,16384,0.05403377612431844
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,4096,10240,0.026183999247021143
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,4096,16384,0.08296266529295179
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,4096,12288,0.04046044415897793
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,4096,12288,0.06715644730461968
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,4096,65536,0.2598373360104031
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,4096,8192,0.021264889174037512
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,4096,51200,0.2074879937701755
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,4096,7168,0.019882667395803664
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,4096,10240,0.05942844682269626
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,4096,8192,0.030849777989917334
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,4096,8192,0.05308444301287333
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,4096,6144,0.017643555998802185
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,4096,7168,0.04966310991181267
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,4096,6144,0.02553422252337138
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,4096,5120,0.014101333088344999
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,4096,5120,0.02300888962215847
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,4096,5120,0.0414613319767846
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,4096,4096,0.01239466667175293
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,5120,1024,0.013457777599493662
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,4096,4096,0.037632889217800565
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,4096,4096,0.020907556017239887
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,4096,3584,0.009610666996902889
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,4096,3072,0.00871733327706655
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,4096,3584,0.03554666704601712
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,4096,3584,0.019398222366968792
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,4096,2560,0.00812000036239624
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,4096,3072,0.017844445175594754
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,4096,2048,0.006917333437336816
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,4096,3072,0.032567110326555036
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,4096,2560,0.01621866722901662
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,4096,10240,0.03564888901180691
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,4096,1536,0.005853333406978183
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,4096,2048,0.02889333168665568
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,4096,1024,0.004635555462704765
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,4096,1536,0.02660177813635932
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,4096,1536,0.014215999179416232
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,4096,768,0.0041475556790828705
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,4096,1024,0.013411555853154926
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,4096,7168,0.028780443800820246
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,4096,1024,0.026038222842746313
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,4096,512,0.00387999994887246
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,4096,6144,0.04393688837687174
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,4096,768,0.0129439996348487
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,4096,256,0.0032248888164758682
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,4096,768,0.024889777104059856
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,4096,128,0.0031973332580592898
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,4096,512,0.023980443676312763
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,4096,512,0.01278222186697854
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,4096,256,0.022333333889643352
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,4096,64,0.0032151111712058387
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,4096,256,0.012097777591811286
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,4096,32,0.0032222221295038858
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,4096,128,0.01921688848071628
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,4096,128,0.0120319997270902
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,4096,64,0.011741333537631564
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,4096,32,0.012079111403889127
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,3584,65536,0.12692266040378147
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,3584,51200,0.10479733016755845
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,3584,65536,0.18056533071729872
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,3584,16384,0.040223111708958946
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,3584,51200,0.1453360054228041
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,3584,12288,0.027407111393080816
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,3584,16384,0.052616887622409396
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,3584,16384,0.08215200238757663
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,4096,2048,0.015125332607163323
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,3584,10240,0.02422488894727495
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,3584,51200,0.2058017783694797
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,3584,65536,0.26013867060343426
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,3584,12288,0.0662906699710422
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,3584,8192,0.01994755533006456
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,3584,10240,0.059333331055111356
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,3584,10240,0.03509599963823954
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,3584,7168,0.017881777551439073
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,3584,8192,0.05273422267701891
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,3584,8192,0.030826667944590252
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,3584,7168,0.049308445718553334
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,3584,5120,0.014441778262456259
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,3584,6144,0.02500711050298479
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,3584,6144,0.04413422279887729
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,3584,4096,0.012337778177526263
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,3584,5120,0.04094400008519491
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,3584,5120,0.022524444593323603
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,3584,3584,0.012383999923865
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,3584,4096,0.020250666472646926
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,3584,4096,0.03702222307523092
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,3584,3072,0.00849866701496972
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,3584,3584,0.03564000129699707
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,3584,3584,0.018594667315483093
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,3584,2560,0.007605333295133378
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,3584,3072,0.01761777698993683
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,3584,3072,0.032812443044450544
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,3584,2048,0.006559111177921295
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,3584,2560,0.015808888607554965
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,3584,2560,0.03047910994953579
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,3584,1536,0.005471111171775394
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,3584,12288,0.04078311059210036
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,3584,2048,0.015113777584499784
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,3584,2048,0.02849688794877794
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,3584,1024,0.0046311111913787
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,3584,1536,0.014108444253603617
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,3584,1536,0.02574577762020959
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,3584,768,0.0041946665280395085
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,3584,1024,0.025426665941874187
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,3584,6144,0.015499555402331881
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,3584,512,0.0038515557017591265
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,3584,7168,0.028196444114049275
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,3584,768,0.025006221400366888
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,3584,256,0.003489777859714296
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,3584,512,0.012740444805887012
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,3584,512,0.023333332604832117
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,3584,128,0.00350577798154619
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,3584,256,0.012100444071822695
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,3584,256,0.023335999912685815
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,3584,64,0.003170666595300039
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,3584,128,0.011730666789743634
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,3584,32,0.003160888950030009
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,3584,128,0.019842666056421068
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,3584,64,0.012318222059143914
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,3584,32,0.011399110986126794
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,3072,65536,0.09786755508846706
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,4096,2560,0.03118488854832119
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,3072,51200,0.07823822233412
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,3072,65536,0.14499821927812365
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,3072,16384,0.030237333642111883
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,3072,51200,0.1144133276409573
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,3072,16384,0.04248088929388258
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,3584,1024,0.013408000270525614
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,3072,12288,0.021199999584092036
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,3072,65536,0.2574506600697835
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,3072,16384,0.08209421899583605
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,3584,768,0.012888888518015543
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,3072,51200,0.20659644073910186
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,3072,10240,0.018340445227093168
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,3072,12288,0.03344977895418803
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,3072,8192,0.015617777903874716
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,3072,12288,0.06637244754367404
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,3072,7168,0.013389333254761167
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,3072,10240,0.02954044606950548
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,3072,8192,0.02597066594494714
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,3072,8192,0.05236711104710897
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,3072,6144,0.012632889052232107
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,3072,5120,0.011049778097205691
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,3072,7168,0.024357333779335022
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,3072,7168,0.04908000098334419
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,3072,6144,0.021243555678261652
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,3072,6144,0.043904887305365674
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,3072,3584,0.008952000074916417
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,3072,5120,0.019671999745898776
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,3072,4096,0.037068443165885076
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,3072,4096,0.017549332645204332
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,3072,3072,0.008279999925030602
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,3072,3584,0.03395466672049628
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,3072,2560,0.00758755538198683
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,3072,3072,0.03229599859979417
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,3072,3072,0.015464888678656684
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,3072,2048,0.006748444504208035
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,3072,2560,0.01479288935661316
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,3072,2560,0.030847999784681533
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,3072,1536,0.005250666704442766
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,3072,2048,0.013923555612564087
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,3072,2048,0.028817776176664565
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,3072,1024,0.004528000122971005
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,3072,1536,0.013447999954223633
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,3072,1536,0.025983111725913152
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,3072,768,0.003910222401221593
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,3072,1024,0.012903999951150684
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,3072,1024,0.024364444944593642
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,3072,512,0.0038702223036024305
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,3072,768,0.012462221913867526
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,3072,10240,0.05874311261706882
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,3072,256,0.003524444583389494
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,3072,512,0.01219555570019616
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,3072,512,0.023939554889996845
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,3072,128,0.002985777747299936
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,3072,4096,0.009654222263230218
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,3072,256,0.011772444678677453
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,3072,256,0.02258488867017958
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,3072,5120,0.04099999864896139
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,3072,64,0.003140444349911478
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,3072,32,0.0031964443624019623
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,3072,128,0.020261334048377145
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,3072,128,0.011698666546079846
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,2560,65536,0.07744266589482625
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,3072,64,0.011734222372372946
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,3072,3584,0.01665422154797448
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,3072,32,0.011712888876597086
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,2560,51200,0.061716443962521024
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,2560,16384,0.02979822291268243
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,2560,65536,0.14204711384243435
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,2560,51200,0.11071644226710002
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,2560,12288,0.023578666978412207
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,2560,16384,0.041245334678226046
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,2560,16384,0.0812515550189548
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,2560,12288,0.032307555278142296
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,2560,12288,0.06559822294447157
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,2560,51200,0.20474221971299914
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,2560,10240,0.028573334217071533
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,2560,8192,0.014543111125628153
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,2560,65536,0.2582346598307292
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,2560,7168,0.013069333301650153
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,2560,6144,0.011707555916574268
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,2560,8192,0.02535022298494975
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,2560,8192,0.05215377940071953
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,2560,7168,0.023940443992614746
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,2560,7168,0.04902222090297275
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,2560,5120,0.010488000180986194
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,2560,6144,0.021009777983029682
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,3072,768,0.025062221619817946
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,2560,6144,0.043374223841561206
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,2560,5120,0.01924888955222236
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,2560,5120,0.040376000934176974
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,2560,3584,0.008671110702885522
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,2560,4096,0.016862221890025668
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,2560,4096,0.035038222869237266
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,2560,3072,0.007923555870850882
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,2560,3584,0.016030222177505493
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,2560,2560,0.007229333122571309
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,2560,3072,0.015132443772421943
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,2560,3072,0.03164444367090861
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,2560,2048,0.00620977787507905
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,2560,2560,0.014444443914625378
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,2560,2048,0.013931555880440606
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,2560,1536,0.005201777650250329
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,2560,2048,0.02837688724199931
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,2560,10240,0.016993777619467843
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,2560,1024,0.004237333519591225
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,2560,1536,0.013408000270525614
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,2560,1536,0.026547556122144062
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,2560,768,0.003859555555714501
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,2560,10240,0.0587751136885749
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,2560,1024,0.012808000048001608
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,2560,1024,0.025751110580232408
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,2560,512,0.003858666867017746
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,2560,768,0.024031110935741003
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,2560,256,0.0035048888789282907
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,2560,512,0.012372444073359171
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,2560,512,0.02472177810139126
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,2560,128,0.0032231110251612137
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,2560,4096,0.009336888790130615
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,2560,256,0.023051554958025616
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,2560,256,0.011779555843936073
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,2560,64,0.002924444360865487
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,2560,128,0.011808888779746162
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,2560,32,0.0034906665484110513
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,2560,3584,0.033556444777382746
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,2560,64,0.011071110765139261
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,2048,65536,0.059296886126200356
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,2560,32,0.012127111355463663
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,2048,51200,0.04897511005401611
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,2560,2560,0.030096888542175293
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,2048,65536,0.13585778077443442
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,2048,16384,0.02330400049686432
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,2048,65536,0.2566195593939887
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,2048,16384,0.04014933440420363
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,2048,51200,0.20347200499640572
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,2048,12288,0.019142222073343065
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,2048,10240,0.017504889104101393
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,2048,12288,0.031679110394583807
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,2048,12288,0.06571200158860949
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,2560,768,0.012553777959611682
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,2048,8192,0.013904889424641928
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,2048,10240,0.02819377846188015
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,2048,7168,0.012809777425395118
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,2048,10240,0.058338668611314565
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,2048,8192,0.05203288793563843
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,2048,8192,0.025137777129809063
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,2048,6144,0.011384888655609555
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,2048,7168,0.023644444015291
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,2048,7168,0.04874311221970452
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,2560,128,0.020056888461112976
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,2048,5120,0.01037688884470198
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,2048,6144,0.020784000555674236
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,2048,6144,0.04344444473584493
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,2048,5120,0.039192001024881996
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,2048,5120,0.01885333326127794
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,2048,3584,0.008254222571849823
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,2048,4096,0.034607112407684326
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,2048,4096,0.01664888858795166
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,2048,3072,0.0076142218377855085
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,2048,3584,0.015863999724388123
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,2048,3584,0.03353600038422479
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,2048,2560,0.006579555571079254
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,2048,51200,0.10982755819956462
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,2048,3072,0.014813333749771118
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,2048,3072,0.03143822153409322
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,2048,2048,0.005557333429654439
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,2048,1536,0.005212444398138259
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,2048,2560,0.02979822291268243
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,2048,2048,0.028797331783506606
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,2048,16384,0.08085155487060547
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,2048,2048,0.013759999639458127
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,2048,1024,0.0041777777175108595
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,2048,768,0.003843555433882607
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,2048,1536,0.013408000270525614
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,2048,1536,0.025814221964942083
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,2048,512,0.003516444315512975
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,2048,1024,0.024681778417693243
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,2048,1024,0.012452444268597497
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,2048,768,0.024345777100986902
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,2048,768,0.012392000191741519
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,2048,256,0.0034977777136696708
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,2048,128,0.003154666680428717
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,2048,512,0.012060444388124677
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,2048,512,0.02331377731429206
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,2048,256,0.022983999715911016
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,2048,256,0.01205599970287747
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,2048,64,0.0031715554909573663
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,2048,128,0.01923022170861562
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,2048,32,0.0028986665937635633
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,2048,64,0.011743110915025076
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,1536,65536,0.05551288856400383
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,2048,4096,0.008968888885445064
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,2048,32,0.011423110961914062
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,1536,51200,0.04381155636575487
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,1536,65536,0.13539111614227295
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,1536,51200,0.10527111424340142
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,1536,16384,0.017743999759356182
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,1536,65536,0.25520533985561794
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,1536,16384,0.08086311154895358
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,1536,16384,0.038881778717041016
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,2048,2560,0.014481777946154276
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,1536,12288,0.01607911123169793
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,1536,10240,0.01517599986659156
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,1536,12288,0.0653911100493537
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,1536,10240,0.058147556251949735
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,1536,10240,0.028016000986099243
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,1536,8192,0.024849777420361836
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,1536,8192,0.05208444595336914
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,1536,7168,0.012734221915404001
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,2048,128,0.011417778001891242
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,1536,6144,0.011360000405046674
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,1536,7168,0.02294755478700002
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,1536,7168,0.04809066653251648
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,1536,5120,0.010305778019958073
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,1536,6144,0.042949332131279834
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,1536,5120,0.01847644481394026
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,1536,4096,0.008947555389669206
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,1536,5120,0.038761778010262385
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,1536,3584,0.00797333319981893
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,1536,4096,0.01647822227742937
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,1536,4096,0.03495644529660543
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,1536,3072,0.007074666519959767
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,1536,51200,0.20300443967183432
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,1536,3584,0.016184889607959323
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,1536,2560,0.00628355559375551
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,1536,3072,0.01475822263293796
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,1536,3072,0.03180088930659824
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,1536,12288,0.031230221192042034
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,1536,2048,0.005557333429654439
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,1536,8192,0.014189332723617554
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,1536,2560,0.014473777678277759
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,1536,2560,0.02979288829697503
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,1536,1536,0.004983110974232356
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,1536,1024,0.004168888760937585
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,1536,2048,0.027808000644048054
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,1536,2048,0.013751111096805997
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,1536,1536,0.026361778378486633
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,1536,768,0.0038657776183552216
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,1536,1536,0.013110222087966071
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,1536,512,0.0035208890007601846
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,1536,1024,0.012439111040698158
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,1536,768,0.024466666910383437
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,1536,768,0.01237155579858356
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,1536,256,0.0035128887328836652
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,1536,512,0.02366311185889774
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,1536,512,0.0124195557501581
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,1536,128,0.0028817777832349143
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,1536,256,0.02274133265018463
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,1536,64,0.002826666666401757
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,1536,6144,0.019920888874265883
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,1536,128,0.011740444435013665
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,1536,32,0.0028311111446883944
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,1024,65536,0.04073333409097459
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,1536,64,0.011728888584507836
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,1536,32,0.011751111182901593
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,1024,51200,0.03169155451986525
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,1536,3584,0.03286577926741706
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,1024,65536,0.13197244538201228
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,1024,16384,0.015233778291278414
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,1024,51200,0.10262488656573826
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,1024,65536,0.25606576601664227
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,1024,12288,0.013447999954223633
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,1024,16384,0.03797422183884515
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,1024,51200,0.2031031052271525
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,1024,16384,0.08037600252363417
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,1024,10240,0.012527999778588613
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,1024,12288,0.030714667505688135
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,1024,12288,0.06531466378106011
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,1536,1024,0.025379555092917547
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,1024,10240,0.027271111806233723
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,1024,10240,0.05797866980234782
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,1024,7168,0.011036444041464063
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,1024,8192,0.05089955528577169
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,1024,8192,0.02423288921515147
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,1024,6144,0.010273777776294285
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,1536,256,0.011749332977665795
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,1024,7168,0.04625155528386434
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,1024,7168,0.02165688905451033
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,1024,5120,0.00906044410334693
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,1024,6144,0.019511999355422128
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,1024,4096,0.008280889027648503
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,1024,6144,0.04112889038191901
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,1024,5120,0.038310223155551486
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,1024,5120,0.01789777808719211
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,1024,3584,0.007233777807818518
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,1024,4096,0.0162808895111084
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,1024,3072,0.006619555668698416
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,1024,3584,0.03319999906751845
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,1024,3072,0.014448889427714877
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,1024,3072,0.030935999419954088
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,1024,2560,0.014096000128322177
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,1024,2560,0.029678222205903795
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,1024,8192,0.011383111278216044
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,1024,2048,0.005558222118351195
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,1024,2048,0.028435554769304063
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,1024,2048,0.013773333695199756
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,1024,1536,0.004552888787455029
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,1024,1024,0.0041928887367248535
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,1024,1536,0.026385777526431616
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,1024,1536,0.013079110946920184
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,1536,128,0.019164444671736825
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,1024,768,0.003858666867017746
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,1024,1024,0.012711111042234631
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,1024,512,0.003539555602603488
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,1024,1024,0.025431111454963684
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,1024,4096,0.03424711028734843
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,1024,768,0.012412444584899478
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,1024,256,0.0031964443624019623
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,1024,512,0.02336799932850732
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,1024,512,0.012096888489193387
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,1024,128,0.002983999955985281
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,1024,256,0.022299556268586054
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,1024,256,0.011763555308183035
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,1024,64,0.00281866660548581
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,1024,32,0.003149333306484752
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,1024,2560,0.005943111247486538
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,1024,128,0.011701333026091257
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,768,65536,0.031790223386552595
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,1024,64,0.011374221907721626
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,1024,32,0.011369778050316704
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,768,51200,0.026150221625963848
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,768,65536,0.12561689482794866
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,768,16384,0.012888000243239932
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,768,51200,0.1018106672498915
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,768,65536,0.25484977828131783
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,768,51200,0.20366577307383218
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,768,12288,0.01146311147345437
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,768,16384,0.03752177622583177
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,768,16384,0.07986666758855183
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,768,12288,0.06496444675657484
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,768,10240,0.026882666680547927
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,768,8192,0.01204711116022534
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,1024,768,0.02366133365366194
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,768,8192,0.022989332675933838
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,1024,3584,0.015849777393870883
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,768,7168,0.011210666762457954
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,768,8192,0.05010933346218533
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,768,6144,0.00979200005531311
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,1024,128,0.020630222227838304
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,768,7168,0.021631111701329548
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,768,7168,0.045886221859190196
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,768,5120,0.00961599995692571
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,768,6144,0.01923022170861562
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,768,6144,0.04124000006251865
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,768,4096,0.008286221987671321
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,768,5120,0.017880888448821176
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,768,5120,0.03809244434038798
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,768,4096,0.033915556139416166
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,768,4096,0.01648977730009291
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,768,3072,0.006578666468461354
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,768,3584,0.015821332732836407
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,768,3584,0.03263911273744371
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,768,2560,0.005899555567238066
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,768,3072,0.014866666661368476
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,768,10240,0.013185777597957186
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,768,3072,0.030857778257793848
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,768,2048,0.005544888890451855
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,768,12288,0.029983109898037378
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,768,1536,0.004543111142185
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,768,2048,0.02812266680929396
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,768,2048,0.013785777820481194
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,768,10240,0.05702755848566691
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,768,1024,0.004200889004601372
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,768,1536,0.013069333301650153
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,768,1536,0.02642400066057841
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,768,768,0.0035013332962989807
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,768,1024,0.012494222157531314
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,768,1024,0.025095999240875244
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,768,512,0.003506666670242945
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,768,768,0.023307555251651343
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,768,768,0.012109333442317115
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,768,256,0.0031600000543726813
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,768,512,0.023359111613697473
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,768,128,0.002806222273243798
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,768,256,0.022062222162882488
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,768,256,0.011749332977665795
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,768,64,0.002790222151411904
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,768,128,0.01888177792231242
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,768,128,0.01146933353609509
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,768,32,0.0028071111689011254
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,768,64,0.011740444435013665
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,512,65536,0.026329777306980554
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,768,32,0.011067555182509951
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,512,65536,0.12852444913652208
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,512,51200,0.02091644373204973
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,768,2560,0.014116444521480136
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,512,65536,0.25485067897372776
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,512,16384,0.013750221994188098
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,512,51200,0.10217244757546319
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,512,12288,0.011696000066068439
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,512,16384,0.0370124446021186
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,512,51200,0.20298843913608125
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,512,10240,0.010675555302037133
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,512,16384,0.0792693363295661
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,512,12288,0.029493331909179688
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,512,12288,0.06433422035641141
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,768,512,0.012064889073371887
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,512,8192,0.009602666729026372
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,512,10240,0.05580088827345106
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,512,10240,0.026064000195927087
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,512,7168,0.009018667042255402
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,512,6144,0.008374222450786168
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,512,8192,0.02330133318901062
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,512,8192,0.04863111178080241
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,512,7168,0.0455022222465939
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,512,5120,0.00792266676823298
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,512,7168,0.02148977749877506
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,768,3584,0.007941332956155142
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,512,4096,0.007649777664078607
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,512,6144,0.04091466797722711
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,512,3584,0.007266666326257918
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,512,5120,0.017503110898865592
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,512,4096,0.03393955694304572
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,512,4096,0.016487111647923786
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,512,3072,0.006286222073766921
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,512,3584,0.032857778999540545
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,512,2560,0.005593777944644292
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,512,3072,0.01478666729397244
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,768,2560,0.03016177813212077
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,512,2048,0.005254222287072076
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,512,2560,0.029508444997999404
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,512,2048,0.013520888984203339
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,512,2048,0.028031110763549805
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,512,1536,0.004585777719815572
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,512,1536,0.012777778009573618
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,512,1536,0.02622933354642656
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,512,1024,0.004017777740955353
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,512,1024,0.012712000144852532
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,512,1024,0.024725332856178284
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,512,768,0.003569777641031477
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,512,6144,0.019474666979577806
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,512,768,0.012054222325483957
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,512,768,0.024683554967244465
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,512,5120,0.03836444351408217
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,512,256,0.003137777869900068
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,512,512,0.023363555471102398
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,512,512,0.01204622205760744
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,512,128,0.0028133332315418455
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,512,256,0.011691555380821228
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,512,3072,0.030692444907294378
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,512,64,0.0028275555620590844
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,512,128,0.011374221907721626
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,512,128,0.0203457772731781
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,512,32,0.0025351111673646504
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,512,2560,0.013939556148317126
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,256,65536,0.020522667302025687
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,512,64,0.01108088923825158
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,256,51200,0.017879999346203275
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,256,65536,0.12640889485677084
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,256,51200,0.09689688682556152
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,256,65536,0.25633690092298717
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,256,16384,0.009696889254781935
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,256,51200,0.2027697828080919
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,256,16384,0.035207112630208336
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,256,16384,0.07812622520658705
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,256,12288,0.00867911097076204
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,256,10240,0.009320889082219865
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,512,512,0.0031973332580592898
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,256,12288,0.06255466408199735
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,256,12288,0.028777778148651123
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,256,8192,0.008377778033415476
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,256,10240,0.025701334079106648
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,256,7168,0.007958222594526079
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,256,10240,0.055431998438305326
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,512,3584,0.015483554866578845
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,256,8192,0.022626666559113398
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,256,6144,0.007653333246707916
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,512,256,0.022986667023764715
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,256,7168,0.020980444219377305
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,256,7168,0.045534223318099976
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,256,6144,0.019159111711714003
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,256,6144,0.04043733411365085
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,256,4096,0.0076044441925154785
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,256,5120,0.038374221987194486
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,256,5120,0.017345777816242643
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,256,3584,0.00702400008837382
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,512,32,0.011708444191349877
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,256,3072,0.0069191112286514705
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,256,4096,0.016036444240146212
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,256,4096,0.033909334076775446
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,256,2560,0.00590844452381134
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,256,3584,0.015225778023401896
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,256,3584,0.032906668053732976
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,256,3072,0.03042844600147671
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,256,3072,0.014783110883500842
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,256,2048,0.005223111146026188
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,256,2560,0.01382844481203291
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,256,2560,0.030163556337356567
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,256,1536,0.004576000074545543
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,256,2048,0.013426666458447775
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,256,2048,0.027845333019892376
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,256,1024,0.0038328886859946777
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,256,1536,0.02539199921819899
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,256,1536,0.01312888910373052
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,256,768,0.0035777779089079965
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,256,1024,0.012372444073359171
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,256,1024,0.0255404445860121
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,256,512,0.0034933334423436057
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,256,768,0.012404444317022959
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,256,768,0.023835556374655828
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,256,256,0.0031715554909573663
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,256,512,0.023021333747439917
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,256,512,0.012087110843923358
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,256,128,0.002875555513633622
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,256,8192,0.04864977796872457
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,256,256,0.011360888679822287
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,256,256,0.0229768885506524
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,256,32,0.002491555487116178
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,256,128,0.020569778150982328
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,128,65536,0.014987554815080432
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,256,128,0.011366222467687396
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,256,64,0.010680889089902243
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,128,51200,0.013386666774749756
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,256,32,0.011504000259770287
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,128,16384,0.009694221946928237
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,128,65536,0.12536799907684326
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,128,51200,0.0984133349524604
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,128,65536,0.2554391225179036
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,128,51200,0.20328177346123588
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,128,12288,0.008347555167145198
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,128,10240,0.008971555365456475
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,128,16384,0.07764977878994413
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,128,12288,0.028764443265067205
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,128,10240,0.05544711152712504
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,128,10240,0.025739555557568867
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,128,8192,0.04846133457289802
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,128,8192,0.022620444496472675
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,128,7168,0.007992888490358988
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,128,7168,0.04516444603602091
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,128,7168,0.021264889174037512
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,128,6144,0.007661333514584436
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,256,64,0.0028604444944196274
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,128,5120,0.007264888948864407
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,128,6144,0.018929777873886954
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,256,5120,0.00796088907453749
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,128,6144,0.04050488935576545
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,128,4096,0.006632888896597757
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,128,5120,0.03808800048298306
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,128,5120,0.017197334104114108
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,128,4096,0.016143111719025504
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,128,4096,0.03432800041304694
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,128,3072,0.0062977779242727495
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,128,16384,0.035967999034457736
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,128,3072,0.01479466590616438
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,128,2560,0.006519111080302133
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,128,3072,0.030896888838873968
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,128,12288,0.06255288918813069
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,128,8192,0.008166222108734978
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,128,2048,0.005971555494599872
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,128,2560,0.014170666535695394
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,128,2560,0.030103110604816016
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,128,1536,0.0045422220395671
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,128,2048,0.013401777380042605
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,128,1024,0.0038204445607132385
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,128,1536,0.013101333545313941
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,128,1536,0.026100445124838088
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,128,768,0.0035128887328836652
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,128,1024,0.012392889294359418
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,128,1024,0.025078222155570984
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,128,512,0.0031884445084465873
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,128,768,0.012096000214417776
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,128,768,0.02399377855989668
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,128,256,0.0029279999434947968
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,128,512,0.023642667465739783
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,128,256,0.011391999820868174
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,128,256,0.022628444764349196
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,128,3584,0.006543111056089401
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,128,128,0.002667555585503578
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,128,64,0.0028373334142896864
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,128,3584,0.015156444576051501
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,128,128,0.011708444191349877
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,128,32,0.0026515554636716843
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,64,65536,0.01407999959256914
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,128,32,0.011697777443461947
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,64,51200,0.012785777449607849
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,64,65536,0.12412710984547932
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,64,16384,0.008976889153321585
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,128,2048,0.027802666028340656
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,64,12288,0.007962666451931
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,64,51200,0.09857689009772407
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,64,10240,0.007318221860461765
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,64,16384,0.034620443979899086
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,64,12288,0.02849422229660882
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,64,10240,0.02571022179391649
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,128,512,0.012238221863905588
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,64,8192,0.022683555881182354
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,64,7168,0.0069208890199661255
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,64,6144,0.006606222026877933
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,64,7168,0.021321778496106465
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,64,5120,0.006310222049554189
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,128,3584,0.03219377663400438
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,64,6144,0.019294222195943195
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,64,4096,0.005967111223273807
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,128,64,0.01073066641887029
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,64,3584,0.006424888968467712
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,64,3072,0.005903111149867375
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,64,5120,0.01774133410718706
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,64,4096,0.01651022169325087
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,64,2560,0.006291555447710886
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,64,3584,0.01516266663869222
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,64,1536,0.004519999855094486
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,64,3072,0.014091556270917257
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,64,2560,0.014146667387750415
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,64,1024,0.003920888735188378
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,64,768,0.0035128887328836652
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,64,1536,0.012730666332774691
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,64,512,0.0032195556494924757
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,64,1024,0.012723555167516073
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,64,768,0.011744000017642975
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,64,256,0.0028799999919202593
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,64,128,0.002814222127199173
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,64,512,0.011731555892361535
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,64,8192,0.006984000404675801
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,64,64,0.0026497778793176017
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,64,32,0.002524444419476721
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,64,128,0.011705777711338468
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,32,65536,0.014084445105658637
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,64,64,0.011037333144081963
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,64,32,0.011026666396194033
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,32,51200,0.012276444170210095
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,32,16384,0.00850755555762185
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,32,65536,0.12477421760559082
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,32,12288,0.00792622235086229
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,32,51200,0.0966000027126736
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,32,16384,0.03490133417977227
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,32,10240,0.007271111011505127
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,32,8192,0.0069368887278768755
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,32,12288,0.028802666399214003
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,32,7168,0.006639110959238476
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,32,10240,0.025754666990704004
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,64,2048,0.005967111223273807
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,32,6144,0.0063493334584765965
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,32,5120,0.006291555447710886
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,32,7168,0.021330666210916307
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,64,2048,0.013787555197874704
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,32,4096,0.005945777727497949
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,32,3584,0.0063635553750726916
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,32,5120,0.01717155509524875
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,32,3072,0.005963555640644497
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,32,4096,0.01651022169325087
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,32,2560,0.006605333338181178
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,32,3584,0.015513777732849121
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,32,3072,0.014330666926172046
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,64,256,0.011414222419261932
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,32,1536,0.004520888957712385
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,32,2560,0.014160888062583076
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,32,1024,0.003871110992299186
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,32,2048,0.013108444710572561
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,32,768,0.003524444583389494
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,32,1536,0.012454222473833295
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,32,512,0.003175111073586676
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,32,1024,0.012449777788586087
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,32,256,0.0028391112056043413
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,32,768,0.012054222325483957
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,32,128,0.002826666666401757
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,32,512,0.011704000333944956
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,32,64,0.002587555597225825
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,32,256,0.011774222056070963
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,32,32,0.0025519999778932994
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,32,128,0.011136888629860349
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,32,64,0.010743111371994019
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,32,8192,0.022476444641749065
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,32,6144,0.019253333409627277
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,65536,16384,0.3843982219696045
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,192,32,2048,0.005939555664857228
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,65536,16384,0.2941226694318983
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,65536,12288,0.2929164568583171
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,65536,12288,0.21826310952504477
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,65536,10240,0.2345502111646864
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,65536,51200,0.906952010260688
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,65536,51200,1.2053208880954318
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,65536,8192,0.19435644149780273
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,65536,7168,0.16917778386010063
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,65536,10240,0.18621155950758192
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,192,32,32,0.011413333316644033
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,65536,8192,0.15264177322387695
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,65536,6144,0.14394933647579616
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,65536,5120,0.1239360041088528
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,65536,4096,0.10336799754036798
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,65536,6144,0.11448710494571263
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,65536,3584,0.08726933267381455
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,65536,3072,0.07726933558781941
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,65536,4096,0.08109955655203925
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,65536,7168,0.13222489092085096
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,65536,2560,0.06306755542755127
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,65536,3584,0.07273511091868083
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,65536,3072,0.06429066922929552
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,65536,2048,0.0523173345459832
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,65536,2560,0.05698844459321764
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,65536,1536,0.04023289018207126
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,65536,1024,0.03001333276430766
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,65536,768,0.022894221875402663
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,65536,512,0.016362667083740234
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,65536,1536,0.040934221612082586
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,65536,1024,0.033879111210505165
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,65536,256,0.010743111371994019
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,65536,768,0.03175110949410333
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,65536,128,0.009637333452701569
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,65536,512,0.025302223033375208
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,65536,64,0.009407111340098912
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,65536,256,0.02233244478702545
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,65536,32,0.01033688916100396
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,65536,64,0.02093244426780277
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,65536,32,0.020602666669421725
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,65536,128,0.021320889393488567
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,65536,5120,0.09754133224487305
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,51200,16384,0.2922186586591932
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,65536,2048,0.04943822158707512
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,51200,51200,0.7127484215630425
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,51200,65536,0.9285768932766385
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,51200,51200,0.9048737419976128
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,51200,12288,0.22333423296610513
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,51200,12288,0.17655821641286215
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,51200,10240,0.20400355921851265
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,51200,8192,0.165885329246521
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,51200,7168,0.1454088952806261
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,51200,8192,0.12531733512878418
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,51200,10240,0.1514755619896783
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,51200,6144,0.12613956133524576
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,51200,7168,0.10742221938239203
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,51200,5120,0.10727377732594807
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,51200,6144,0.09384710921181573
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,51200,4096,0.08724888828065659
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,51200,3584,0.07780088980992635
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,51200,4096,0.06740266746944852
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,51200,3584,0.060805333985222705
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,51200,5120,0.08033244477377997
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,51200,2560,0.057244446542527944
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,51200,16384,0.2364035447438558
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,51200,65536,1.1517146428426106
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,51200,2048,0.047051555580563016
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,51200,2560,0.04820800158712599
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,51200,1536,0.036978665325376726
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,51200,1024,0.02817866537306044
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,51200,2048,0.042091555065578885
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,51200,1536,0.03537155522240533
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,51200,512,0.01592177814907498
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,51200,512,0.022239110536045496
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,51200,256,0.01163200040658315
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,51200,768,0.028079999817742243
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,51200,256,0.020257777637905545
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,51200,128,0.019241778386963736
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,51200,64,0.006246222390068903
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,51200,32,0.006525333142942852
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,51200,3072,0.06832177771462335
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,51200,64,0.01924888955222236
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,51200,32,0.019544000426928203
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,51200,3072,0.05419377817047966
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,51200,768,0.021507556239763897
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,16384,51200,0.29280710220336914
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,16384,65536,0.3759626547495524
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,16384,16384,0.09680889050165813
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,16384,51200,0.2894382211897108
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,16384,12288,0.07475022474924724
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,16384,10240,0.062253336111704506
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,16384,12288,0.07664266559812757
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,16384,16384,0.10075289011001587
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,16384,7168,0.04533866710133023
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,51200,1024,0.029116445117526587
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,51200,128,0.007630222373538547
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,16384,8192,0.05801333321465386
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,16384,5120,0.034318221939934626
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,16384,7168,0.04836533466974894
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,16384,6144,0.04344444473584493
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,16384,4096,0.028509332074059382
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,16384,10240,0.06703555583953857
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,16384,3584,0.025290666355027094
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,16384,5120,0.038418667183982
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,16384,3072,0.022660444180170696
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,16384,4096,0.03321955601374308
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,16384,2560,0.018903111418088276
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,16384,3584,0.030885332160525854
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,16384,2048,0.015823110938072205
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,16384,1536,0.012665777570671506
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,16384,3072,0.02836444311671787
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,16384,1024,0.010319111247857412
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,16384,2560,0.024681778417693243
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,16384,2048,0.022340445054901972
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,16384,768,0.008457777400811514
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,16384,512,0.006778666542636023
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,16384,1024,0.017492444978819955
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,16384,256,0.004854222138722737
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,16384,768,0.01735911104414198
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,16384,65536,0.3675528897179498
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,16384,512,0.015471999843915304
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,16384,128,0.004261333495378494
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,16384,64,0.0038942222793896994
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,16384,256,0.014144000079896716
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,16384,32,0.003858666867017746
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,16384,128,0.013438222308953604
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,16384,64,0.014166222678290473
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,16384,32,0.016157334049542744
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,16384,6144,0.03946844405598111
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,12288,65536,0.27508799235026044
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,12288,16384,0.07317599985334608
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,12288,51200,0.21606844001346162
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,12288,65536,0.282005336549547
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,12288,51200,0.2238088978661431
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,12288,12288,0.05734044313430786
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,12288,10240,0.04745689034461975
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,12288,12288,0.061111112435658775
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,12288,8192,0.04070399867163764
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,12288,16384,0.07937244574228923
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,12288,7168,0.03485866718822055
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,12288,10240,0.05391377872890896
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,16384,1536,0.02017333275742001
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,12288,6144,0.030653334326214258
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,12288,8192,0.04683466752370199
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,12288,5120,0.02665688925319248
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,12288,7168,0.0392577780617608
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,12288,4096,0.022934221559100684
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,12288,3584,0.01982311076588101
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,12288,6144,0.035431110196643405
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,12288,3072,0.017502221796247695
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,12288,5120,0.03156800071398417
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,12288,2560,0.014561777313550314
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,12288,4096,0.027871999475691054
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,12288,3584,0.025225778420766194
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,12288,2048,0.012828444441159567
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,12288,1536,0.010680889089902243
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,12288,3072,0.0229102224111557
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,16384,8192,0.05275377631187439
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,12288,1024,0.008660444782839881
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,12288,768,0.007598222129874759
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,12288,2560,0.02130488885773553
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,12288,2048,0.019894222418467205
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,12288,1536,0.017859554953045316
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,12288,256,0.00489066665371259
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,12288,1024,0.016011555989583332
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,12288,128,0.004344888859324985
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,12288,768,0.016134222348531086
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,12288,512,0.014478221535682678
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,12288,64,0.003863999827040566
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,12288,256,0.01346577786737018
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,12288,32,0.0039057777159743835
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,12288,128,0.01308444473478529
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,12288,64,0.013444444371594323
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,12288,32,0.01512977812025282
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,10240,16384,0.06964621941248576
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,10240,65536,0.2625653213924832
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,10240,51200,0.20581689145829943
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,10240,65536,0.269174231423272
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,10240,51200,0.21275822321573892
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,10240,12288,0.05447555581728617
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,10240,10240,0.04537422127193875
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,10240,16384,0.07630311118231879
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,10240,12288,0.05888355440563626
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,10240,8192,0.03853333327505324
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,10240,7168,0.03377155462900797
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,10240,6144,0.029490666257010564
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,10240,10240,0.052199999491373696
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,10240,5120,0.025404444999165002
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,10240,8192,0.04516888989342583
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,10240,7168,0.03792622354295518
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,10240,4096,0.021911111142900255
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,10240,3584,0.01903377804491255
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,10240,6144,0.034282667769326106
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,10240,3072,0.01692800058258904
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,10240,5120,0.03046577837732103
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,10240,4096,0.025900445050663416
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,10240,3584,0.024456888437271118
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,10240,2048,0.0127697777416971
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,12288,512,0.00628977765639623
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,10240,1536,0.01038577738735411
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,10240,1024,0.008607111043400234
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,10240,2560,0.02128622266981337
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,10240,2048,0.019183999962276883
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,10240,1536,0.017498667041460674
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,10240,512,0.005610666755172942
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,10240,768,0.015229332778188916
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,10240,256,0.004880889008442561
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,10240,512,0.014119111829333834
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,10240,128,0.004176889028814104
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,10240,256,0.013131555583741931
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,10240,64,0.0041991112132867174
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,10240,128,0.01274311128589842
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,10240,32,0.004523555437723796
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,10240,64,0.01274577776590983
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,10240,32,0.01239911135700014
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,8192,65536,0.22079732682969835
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,10240,2560,0.01475911173555586
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,10240,3072,0.0225600004196167
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,8192,65536,0.22693867153591582
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,8192,51200,0.1718684434890747
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,10240,768,0.007274666594134436
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,8192,16384,0.05877066983116997
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,8192,12288,0.04531022244029575
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,8192,51200,0.1802497837278578
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,10240,1024,0.015449777245521545
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,8192,16384,0.06565244330300225
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,8192,10240,0.03798310955365499
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,8192,8192,0.03255733185344272
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,8192,12288,0.05137066708670723
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,8192,7168,0.028399109840393066
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,8192,6144,0.024695111645592585
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,8192,10240,0.04527911212709215
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,8192,5120,0.021504888931910198
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,8192,8192,0.038648890124426946
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,8192,7168,0.032840887705485024
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,8192,4096,0.018840889135996502
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,8192,6144,0.02983022067281935
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,8192,3584,0.015951111912727356
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,8192,3072,0.0144533332851198
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,8192,2560,0.012343111137549082
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,8192,5120,0.025972444150182936
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,8192,4096,0.023383999864260357
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,8192,3584,0.022036444809701707
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,8192,2048,0.011015999648306104
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,8192,3072,0.020455999506844413
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,8192,1536,0.009304888546466827
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,8192,1024,0.007647111184067196
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,8192,2560,0.01963200006220076
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,8192,768,0.00591822216908137
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,8192,2048,0.01772533357143402
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,8192,512,0.004934222333961063
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,8192,1536,0.01601777805222405
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,8192,256,0.004181333300140169
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,8192,1024,0.014440000057220459
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,8192,128,0.003551111039188173
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,8192,768,0.014863111906581454
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,8192,64,0.0035093331502543557
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,8192,512,0.013618666264745923
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,8192,32,0.003540444291300244
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,8192,256,0.01275288893116845
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,8192,128,0.01238044434123569
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,8192,64,0.012132444315486483
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,8192,32,0.01260355528857973
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,7168,16384,0.05474133292833964
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,7168,65536,0.20492000050014922
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,7168,12288,0.043282667795817055
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,7168,10240,0.03673333260748122
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,7168,65536,0.22134666972690156
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,7168,51200,0.17524266242980957
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,7168,16384,0.06445511182149251
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,7168,8192,0.031439112292395696
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,7168,12288,0.05091377761628893
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,7168,7168,0.027110222313139174
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,7168,6144,0.02397955622937944
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,7168,10240,0.04421866602367825
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,7168,5120,0.02032177812523312
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,7168,8192,0.036978665325376726
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,7168,4096,0.01682488951418135
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,7168,7168,0.0324577788511912
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,7168,3584,0.01499288943078783
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,7168,6144,0.028869334194395278
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,7168,3072,0.01383733335468504
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,7168,5120,0.025701334079106648
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,7168,2560,0.011969777444998423
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,7168,4096,0.023077333966890972
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,7168,2048,0.010632889138327705
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,7168,1536,0.008962666822804345
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,7168,3072,0.020344000723626878
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,7168,1024,0.006584888945023219
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,7168,2560,0.0192239996459749
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,7168,2048,0.017477333545684814
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,7168,768,0.00554577757914861
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,7168,512,0.004600000050332812
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,7168,1536,0.016024889217482675
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,7168,256,0.004179555508825514
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,7168,1024,0.014152000347773233
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,7168,128,0.003510222252872255
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,7168,512,0.013420444395807056
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,7168,256,0.012736000120639801
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,7168,64,0.00388711111413108
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,7168,32,0.0041831110914548235
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,7168,128,0.012273777690198688
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,7168,64,0.012379555238617791
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,7168,51200,0.1609786616431342
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,7168,32,0.012039110892348819
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,6144,65536,0.18080711364746094
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,6144,16384,0.04747822218471103
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,6144,51200,0.14498755666944715
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,6144,65536,0.18290311760372588
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,6144,51200,0.146579556994968
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,6144,12288,0.03637155559327867
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,6144,10240,0.03187111020088196
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,6144,16384,0.05490577883190579
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,6144,8192,0.026546667019526165
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,6144,12288,0.04367022381888496
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,6144,7168,0.02328266700108846
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,6144,10240,0.03664088911480374
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,6144,6144,0.020448888341585796
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,6144,8192,0.03161155515246921
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,6144,5120,0.017472889688279893
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,6144,7168,0.027170666389995154
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,6144,6144,0.025018667181332905
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,6144,4096,0.014800000521871777
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,6144,3584,0.013284444808959961
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,6144,5120,0.023007111416922674
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,7168,768,0.014722666806644864
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,6144,4096,0.020650666620996263
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,6144,3072,0.012477333347002665
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,6144,3584,0.01977244516213735
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,6144,2048,0.009667555491129557
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,6144,3072,0.018398221996095445
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,6144,2560,0.01724444495307075
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,6144,1536,0.008258666429254744
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,6144,1024,0.006646222124497096
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,6144,2048,0.015569777952300178
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,6144,768,0.005219555563396878
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,6144,1536,0.014488889111412896
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,6144,512,0.004579555657174853
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,6144,1024,0.01368622233470281
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,6144,256,0.00388711111413108
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,6144,768,0.013819555441538492
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,6144,128,0.0035093331502543557
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,6144,512,0.013054221868515015
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,6144,64,0.0032808888289663526
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,6144,256,0.01237066669596566
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,6144,32,0.003530666646030214
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,6144,128,0.01204622205760744
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,6144,64,0.012088889049159156
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,7168,3584,0.02219911085234748
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,6144,32,0.011714666253990598
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,5120,65536,0.14653155538770887
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,5120,51200,0.11810933219061957
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,5120,16384,0.04356000158521864
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,5120,12288,0.03397866752412584
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,5120,65536,0.1804871161778768
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,5120,51200,0.14311999744839138
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,5120,10240,0.028765334023369685
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,5120,16384,0.05336622065967984
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,5120,8192,0.02441066669093238
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,5120,12288,0.04111822115050422
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,5120,7168,0.021583999196688335
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,5120,10240,0.03547733359866672
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,5120,6144,0.019034667147530448
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,5120,5120,0.01611555616060893
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,5120,8192,0.030806223551432293
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,5120,7168,0.026552889082166884
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,5120,4096,0.013643555343151093
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,5120,6144,0.02443644404411316
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,5120,3584,0.012113778127564324
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,5120,5120,0.022610666023360357
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,5120,4096,0.020303999384244282
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,5120,3584,0.01943466729587979
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,5120,2560,0.00962311112218433
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,5120,2048,0.008461332983440822
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,5120,3072,0.018173333671357896
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,5120,1536,0.007299555672539606
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,5120,2560,0.016472889317406546
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,5120,1024,0.005559111220969095
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,192,128,128,0.020239111449983384
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,5120,1536,0.014448000325096978
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,5120,768,0.004879999905824661
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,5120,512,0.0041866666740841335
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,5120,1024,0.013457777599493662
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,5120,256,0.0038613333470291565
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,5120,768,0.013800889253616333
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,5120,128,0.003555555724435382
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,5120,512,0.01311466677321328
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,5120,64,0.0035048888789282907
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,5120,256,0.01237155579858356
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,5120,32,0.003504000190231535
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,5120,128,0.012060444388124677
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,6144,2560,0.010685332947307162
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,5120,64,0.012220444778601328
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,5120,32,0.011711111499203576
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,4096,51200,0.08960533142089844
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,4096,16384,0.03661155700683594
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,4096,65536,0.17224621772766113
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,4096,12288,0.029616001579496596
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,4096,51200,0.13777421580420599
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,5120,3072,0.011152000062995486
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,4096,10240,0.023636443747414485
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,4096,8192,0.019864888654814828
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,4096,16384,0.05107644531461927
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,4096,12288,0.03878133495648702
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,4096,7168,0.017567111386193168
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,4096,10240,0.034190220965279475
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,4096,6144,0.015498666299713982
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,4096,8192,0.030135999123255413
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,4096,5120,0.013419555293189155
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,4096,7168,0.026362667481104534
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,4096,4096,0.012723555167516073
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,4096,3584,0.00944800012641483
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,4096,6144,0.024039111203617517
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,5120,2048,0.01512977812025282
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,4096,5120,0.022379555635982092
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,4096,3072,0.008775999976529015
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,4096,2560,0.00793422261873881
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,4096,4096,0.02028888960679372
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,4096,2048,0.0069013333155049225
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,4096,3584,0.018901333212852478
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,4096,1536,0.005558222118351195
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,4096,3072,0.01681600014368693
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,4096,1024,0.004577777865860197
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,4096,2560,0.016211556063758004
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,4096,768,0.004538666870858935
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,4096,2048,0.01500266624821557
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,4096,512,0.0038488888078265717
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,4096,1536,0.014270222849316068
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,4096,256,0.0034737777378824023
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,4096,1024,0.013185777597957186
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,4096,768,0.013807999591032663
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,4096,128,0.003479111111826367
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,4096,512,0.012808889150619507
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,4096,64,0.003198222153716617
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,4096,32,0.003334222154484855
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,4096,256,0.012103999654452005
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,4096,128,0.011716444459226398
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,4096,64,0.012093333734406365
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,4096,32,0.012089778151777057
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,3584,65536,0.10280799865722656
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,4096,65536,0.11398488945431179
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,3584,51200,0.08271555768118964
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,3584,16384,0.03414400087462531
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,3584,12288,0.027112000518374976
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,3584,10240,0.023942222197850544
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,3584,65536,0.1699697838889228
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,3584,16384,0.049717333581712514
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,3584,51200,0.1357004510031806
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,3584,8192,0.018608889646000333
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,3584,12288,0.03769155674510532
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,3584,7168,0.016864000095261466
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,3584,6144,0.01480977733929952
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,3584,10240,0.03353155652681986
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,3584,5120,0.013167111410035027
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,3584,8192,0.029480000336964924
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,3584,4096,0.011393778026103973
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,3584,7168,0.026269333230124578
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,3584,6144,0.023863111933072407
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,3584,3584,0.010255110760529837
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,3584,3072,0.00960000024901496
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,3584,5120,0.02200355629126231
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,3584,2560,0.008463111188676622
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,3584,4096,0.019480889042218525
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,3584,2048,0.007301333049933116
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,3584,1536,0.005902222047249476
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,3584,1024,0.004863111095296012
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,3584,3072,0.016532444291644625
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,3584,2560,0.016176889340082806
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,3584,768,0.004403555558787452
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,3584,2048,0.014825777875052558
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,3584,512,0.003887999802827835
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,3584,256,0.003549333247873518
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,3584,1024,0.013410666750537025
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,3584,128,0.0032035555276605818
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,3584,512,0.012738666600651212
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,3584,64,0.003154666680428717
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,3584,256,0.01239466667175293
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,3584,32,0.0032515554792351196
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,3584,128,0.011866666376590729
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,3584,64,0.011711999773979187
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,3072,65536,0.07880355252159967
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,3584,32,0.011704888608720569
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,3072,51200,0.06319377819697063
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,3072,16384,0.026613333159022864
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,3072,12288,0.02234933276971181
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,3072,65536,0.1327706707848443
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,3072,51200,0.10572266578674316
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,3072,10240,0.019537778364287484
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,3072,8192,0.017966222431924608
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,3072,12288,0.03084711233774821
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,3072,7168,0.016128889388508268
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,3072,10240,0.027740443746248882
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,3072,8192,0.025080889463424683
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,3584,3584,0.018000000052981906
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,3072,7168,0.02200355629126231
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,3072,5120,0.013034666577974955
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,3072,4096,0.012083555261294046
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,3584,1536,0.01444533301724328
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,3072,5120,0.019052444232834708
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,3072,3584,0.010297777752081553
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,3072,3072,0.00928177767329746
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,3584,768,0.013779555757840475
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,3072,2560,0.008749333520730337
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,3072,3584,0.015818667080667283
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,3072,2048,0.0075911109646161394
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,3072,3072,0.014793778459231058
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,3072,1536,0.006183111005359226
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,3072,2048,0.013758222262064615
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,3072,1024,0.004875555634498596
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,3072,1536,0.013430222041077085
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,3072,768,0.0041955556306574075
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,3072,1024,0.01278222186697854
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,3072,16384,0.03914489017592536
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,3072,512,0.0038693332009845306
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,3072,768,0.013406222065289816
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,3072,256,0.003632889025741153
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,3072,128,0.0032151111712058387
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,3072,512,0.012454222473833295
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,3072,256,0.012086222569147745
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,3072,6144,0.014877332581414117
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,3072,64,0.0028168888141711554
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,3072,128,0.011438222395049201
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,3072,32,0.0031724443866146933
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,3072,64,0.011426666544543372
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,2560,65536,0.07530933618545532
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,3072,32,0.011371555427710215
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,2560,51200,0.06045155392752754
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,2560,16384,0.025401777691311304
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,3072,4096,0.017047999633683097
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,2560,12288,0.021357332666714985
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,2560,10240,0.01868088874551985
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,2560,65536,0.12896354993184408
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,2560,51200,0.10334044694900513
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,2560,16384,0.03804711169666714
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,2560,8192,0.015283554792404175
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,2560,12288,0.03019022279315525
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,2560,7168,0.013618666264745923
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,3072,2560,0.014488000008794995
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,2560,10240,0.027077333794699773
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,2560,6144,0.012180444267061023
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,2560,5120,0.010938666760921478
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,2560,4096,0.00963644435008367
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,2560,8192,0.024664888779322307
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,2560,3584,0.008965333302815756
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,2560,7168,0.021535111798180476
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,2560,6144,0.020131554868486192
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,2560,3072,0.007995555798212687
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,2560,5120,0.01809777816136678
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,2560,4096,0.01685422162214915
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,2560,2048,0.00628266649113761
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,2560,3584,0.015454222758611044
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,2560,3072,0.014785778191354541
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,2560,1536,0.005565333283609814
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,2560,2560,0.01444533301724328
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,2560,768,0.00433688900536961
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,2560,2048,0.013821333646774292
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,2560,1536,0.013416888813177744
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,2560,512,0.0038888889054457345
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,2560,1024,0.012735111018021902
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,2560,256,0.003536000019974179
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,2560,128,0.0031600000543726813
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,2560,768,0.012737777498033313
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,2560,512,0.012436444560686747
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,2560,256,0.011722666521867117
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,2560,32,0.002990222225586573
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,2560,128,0.011730666789743634
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,3072,6144,0.020605333977275424
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,2560,64,0.011743110915025076
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,2048,65536,0.06079822116427951
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,2560,32,0.011145778000354767
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,2048,51200,0.049286223120159574
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,2048,16384,0.021609778205553692
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,2048,65536,0.12516000535753039
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,2048,12288,0.017895999881956313
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,2048,51200,0.10032977660497029
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,2048,10240,0.017172444197866652
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,2048,16384,0.03705688979890611
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,2048,8192,0.016211556063758004
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,2048,12288,0.029509332444932725
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,2048,7168,0.01534577707449595
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,2048,10240,0.026876444617907207
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,2048,6144,0.01146133326821857
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,2048,8192,0.02416977783044179
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,2048,5120,0.010316444767846001
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,2048,4096,0.009292444421185387
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,2560,2560,0.007248889240953658
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,2048,3584,0.008624888956546783
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,2048,6144,0.019596444235907663
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,2048,5120,0.017509332961506315
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,2048,3072,0.007621333003044128
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,2560,1024,0.004564444637960858
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,2048,4096,0.015992000699043274
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,2048,2560,0.006666666517655055
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,2048,2048,0.006240889016124938
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,2048,1536,0.005230222311284807
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,2048,2560,0.014155555102560254
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,2048,2048,0.013791110780504016
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,2048,1024,0.004237333519591225
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,2048,768,0.0041777777175108595
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,2560,64,0.0028533333291610083
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,2048,1536,0.013252444565296173
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,2048,512,0.003510222252872255
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,2048,256,0.003516444315512975
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,2048,1024,0.0127688886390792
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,2048,128,0.003198222153716617
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,2048,768,0.01275111072593265
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,2048,512,0.012278222375445895
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,2048,64,0.0028560000161329904
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,2048,32,0.0031715554909573663
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,2048,256,0.011710222396585675
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,2048,128,0.011743110915025076
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,1536,65536,0.046089778343836464
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,2048,64,0.011104889214038849
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,2048,32,0.011402666568756104
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,1536,51200,0.036978665325376726
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,1536,16384,0.017902221944597032
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,1536,12288,0.01482222146458096
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,1536,65536,0.12244178189171685
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,1536,16384,0.03605066736539205
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,1536,10240,0.013906665974193148
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,1536,12288,0.029462221595976088
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,2048,7168,0.020928000410397846
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,1536,8192,0.014800000521871777
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,1536,7168,0.013097777962684631
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,1536,10240,0.026383111874262493
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,1536,6144,0.01236533373594284
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,1536,8192,0.023317333724763658
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,2048,3584,0.015480000111791821
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,1536,5120,0.01034222212102678
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,2048,3072,0.014783110883500842
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,1536,7168,0.02030755579471588
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,1536,4096,0.00907555553648207
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,1536,3584,0.007975111405054728
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,1536,6144,0.018562666243977018
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,1536,3072,0.007290666302045186
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,1536,5120,0.017470222380426195
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,1536,2560,0.006533333410819371
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,1536,4096,0.015855999456511605
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,1536,2048,0.0058453331391016645
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,1536,1536,0.004912888838185204
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,1536,3072,0.014514666464593677
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,1536,1024,0.004182222402758068
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,1536,2560,0.014167111780908374
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,1536,2048,0.01368533323208491
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,1536,768,0.0039048890272776284
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,1536,1536,0.013081777426931592
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,1536,512,0.003519111209445529
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,1536,256,0.003160888950030009
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,1536,1024,0.012433778080675336
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,1536,768,0.012793777717484368
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,1536,512,0.012090666426552666
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,1536,256,0.012055111428101858
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,1536,64,0.0028248888750871024
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,1536,32,0.00286311118139161
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,1536,128,0.011711111499203576
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,1536,51200,0.09799466530481975
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,1024,65536,0.03450311223665873
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,1536,64,0.011758222348160215
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,1536,32,0.011380444798204633
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,1024,51200,0.02767466670937008
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,1024,16384,0.016368889146380954
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,1024,12288,0.014070222775141398
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,1024,51200,0.09520355860392253
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,1024,16384,0.035659554931852556
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,1024,10240,0.012492444780137805
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,1024,12288,0.028561777538723413
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,1024,8192,0.011424889167149862
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,1024,7168,0.011000889043013254
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,1024,10240,0.02567911148071289
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,1024,6144,0.010664000279373594
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,1024,7168,0.01995377739270528
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,1024,5120,0.009388444324334463
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,1024,6144,0.018589332699775696
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,1024,4096,0.007961778177155389
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,1024,5120,0.017238222890430026
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,1024,3584,0.007303111255168915
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,1024,4096,0.016027554869651794
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,1024,3072,0.006583111153708563
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,1024,3584,0.015276443627145557
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,1024,2560,0.006221333311663733
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,1024,3072,0.014487110906177096
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,1024,2048,0.005200888961553574
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,1024,2560,0.014162666267818876
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,1024,1536,0.004911111046870549
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,1024,1024,0.0041991112132867174
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,1024,2048,0.013463999662134381
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,1024,768,0.0038373333712418876
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,1024,65536,0.11947733826107448
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,1024,1536,0.013096888860066732
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,1024,512,0.0035146665241983202
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,1024,256,0.0031831111345026228
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,1024,1024,0.012624888784355588
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,1024,128,0.0031617778456873367
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,1024,768,0.012738666600651212
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,1024,512,0.012048888537618848
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,1024,256,0.011771555576059552
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,1024,32,0.0028435554769304064
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,1024,128,0.011773332953453064
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,1536,3584,0.015121777852376303
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,1024,64,0.011397333608733283
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,768,65536,0.0306328899330563
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,768,51200,0.02609599961174859
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,1024,32,0.011064888702498542
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,768,16384,0.013188444077968597
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,768,12288,0.011719110939237805
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,768,65536,0.11769421895345052
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,768,51200,0.0940764413939582
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,768,10240,0.013448889056841532
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,1536,128,0.0028204443968004654
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,768,16384,0.03520088725619846
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,768,8192,0.011990221838156382
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,768,12288,0.027887112564510767
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,768,6144,0.010001777774757808
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,768,10240,0.024693333440356787
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,768,8192,0.022011554903454248
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,768,5120,0.009010666774378883
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,768,4096,0.00795022232664956
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,768,6144,0.018254222141371835
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,768,5120,0.01720177796151903
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,768,3584,0.007257777783605788
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,768,4096,0.01585155559910668
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,768,3072,0.006586666736337874
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,768,3584,0.01512888901763492
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,768,2560,0.005942222144868638
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,768,3072,0.014488000008794995
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,768,2048,0.0063031112982167145
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,1024,64,0.0028080000645584534
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,768,1536,0.005207111024194294
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,768,2560,0.014096000128322177
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,768,1024,0.004591111093759537
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,768,2048,0.013471999930010902
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,768,768,0.003900444342030419
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,768,1536,0.013136000268989138
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,768,512,0.0032791110376516977
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,768,1024,0.0123848890264829
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,768,256,0.0031715554909573663
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,768,768,0.012783110969596438
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,768,128,0.0028391112056043413
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,768,512,0.012400888734393649
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,768,64,0.0025191110455327565
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,768,7168,0.011306666665607028
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,768,32,0.002895111011134254
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,768,128,0.011699555648697747
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,768,64,0.011683555940786997
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,768,7168,0.019578667150603402
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,512,65536,0.025045333637131587
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,512,51200,0.021038222644064162
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,768,32,0.011038222246699862
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,512,16384,0.013732444081041547
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,512,12288,0.012044444680213928
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,512,65536,0.11543822288513184
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,512,16384,0.03424711028734843
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,512,10240,0.011003555523024665
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,512,8192,0.009294222626421187
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,512,10240,0.024352888266245525
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,512,7168,0.008962666822804345
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,1024,8192,0.02211644417709774
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,512,8192,0.021902221772405837
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,512,6144,0.009015999734401703
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,512,5120,0.008281778130266402
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,512,4096,0.007654222349325816
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,512,7168,0.01963200006220076
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,512,6144,0.0185208883550432
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,512,3584,0.006974221931563483
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,512,5120,0.017222222354676988
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,512,3072,0.006305777778228124
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,512,4096,0.015840000576443143
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,512,3584,0.01516533394654592
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,512,3072,0.014576888746685453
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,512,2048,0.005191111316283544
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,512,2560,0.014096000128322177
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,512,1536,0.004541333350870344
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,768,256,0.011800000237094032
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,512,1024,0.003846222327815162
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,512,768,0.0035075553589397003
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,512,2048,0.01368711143732071
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,512,512,0.0035333335399627686
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,512,1536,0.013056000073750814
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,512,1024,0.01239466667175293
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,512,256,0.0031759999692440033
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,512,128,0.0028488888508743713
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,512,512,0.012450666891203986
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,512,256,0.011808888779746162
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,512,51200,0.09245066510306464
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,512,64,0.0028364445186323593
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,512,32,0.0025235555238193935
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,256,65536,0.020568889048364427
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,512,12288,0.027058665951093037
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,512,64,0.011359111302428775
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,256,51200,0.018231999542978074
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,512,32,0.011757333245542316
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,256,16384,0.012044444680213928
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,256,12288,0.010022222167915767
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,256,65536,0.11425777276357015
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,256,16384,0.03325155708524916
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,256,51200,0.0899146662818061
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,256,10240,0.009554666777451834
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,256,8192,0.00868088917599784
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,256,12288,0.027077333794699773
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,256,7168,0.007978666987684038
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,256,6144,0.007647111184067196
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,256,10240,0.0243511117166943
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,256,8192,0.021672000487645466
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,512,2560,0.0058906666106647914
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,256,5120,0.0083137775460879
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,256,7168,0.01956355571746826
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,256,4096,0.007595555649863348
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,256,3584,0.006933333145247565
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,256,6144,0.018230222993426852
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,256,3072,0.006223111102978389
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,256,5120,0.01715555621518029
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,256,2560,0.005596444424655702
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,256,4096,0.015853333804342482
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,256,2048,0.005220444252093633
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,256,3584,0.014836443795098199
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,256,1536,0.004520888957712385
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,256,3072,0.014141332772043018
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,256,1024,0.0038515557017591265
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,256,2560,0.014106666048367819
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,256,2048,0.013463111387358772
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,256,768,0.0035031110876136353
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,256,1536,0.013038222160604266
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,256,512,0.0031866667171319327
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,256,256,0.0030862221287356485
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,256,1024,0.012381333443853589
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,256,128,0.0028355556229750314
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,256,64,0.0028320000403457214
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,256,512,0.012123555772834353
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,256,32,0.002534222271707323
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,512,128,0.011698666546079846
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,256,128,0.011363555159833698
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,128,65536,0.014876445134480795
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,256,64,0.011036444041464063
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,128,51200,0.013441777891582914
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,256,32,0.011706666813956367
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,128,16384,0.009351111120647853
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,128,12288,0.00999466660949919
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,128,65536,0.11210755507151286
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,128,51200,0.08882311317655776
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,128,10240,0.009304888546466827
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,128,8192,0.00831733312871721
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,128,12288,0.02672622270054287
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,128,7168,0.007992000215583378
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,128,10240,0.02382133404413859
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,128,8192,0.021321778496106465
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,128,6144,0.00868444475862715
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,128,5120,0.00795377790927887
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,128,7168,0.01956622302532196
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,128,4096,0.0074026667409473
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,128,6144,0.017906667457686532
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,128,5120,0.016765332884258695
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,128,4096,0.015480889214409722
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,128,3072,0.006246222390068903
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,128,3584,0.014808000789748298
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,512,768,0.01238933371173011
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,128,2560,0.00555288874440723
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,128,2048,0.004864000197913912
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,256,768,0.01239111108912362
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,128,3072,0.014133334159851074
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,256,256,0.012011555333932241
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,128,1536,0.004548444516128964
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,128,2560,0.013461333182122974
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,128,1024,0.003867555409669876
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,128,768,0.0035422220826148987
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,128,2048,0.013067555924256643
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,128,1536,0.012811555630630918
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,128,1024,0.012295111185974546
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,128,768,0.0127688886390792
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,128,128,0.00267999991774559
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,128,512,0.012050666742854647
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,128,64,0.0028248888750871024
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,128,16384,0.03298844562636481
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,128,32,0.002551111082235972
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,128,128,0.011648000114493899
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,64,65536,0.014456889695591398
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,128,32,0.011553777588738335
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,64,51200,0.014484445254007975
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,64,65536,0.11177155706617568
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,64,16384,0.009358222285906473
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,128,3584,0.006623999940024481
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,64,51200,0.08849689033296372
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,64,16384,0.03293066554599338
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,64,10240,0.009008000294367472
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,64,12288,0.026797332697444495
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,64,8192,0.008025777836640676
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,64,10240,0.024382222029897902
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,128,512,0.0032711111836963226
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,64,7168,0.009006222089131674
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,64,8192,0.02161688937081231
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,64,6144,0.008492444124486711
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,128,256,0.002809777855873108
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,64,5120,0.008032889001899296
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,64,4096,0.007272889216740926
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,64,7168,0.019296889503796894
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,64,6144,0.0184888889392217
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,64,3584,0.006978666616810693
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,128,256,0.01145244472556644
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,64,5120,0.01688088807794783
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,64,3072,0.006590222318967183
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,64,2560,0.005542222410440445
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,64,4096,0.015847111741701763
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,64,2048,0.0052151112920708126
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,64,1536,0.004567111117972268
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,64,3584,0.015154666370815702
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,64,3072,0.014161777165200977
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,64,1024,0.003661333272854487
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,64,2560,0.013585777746306526
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,64,768,0.0035502223504914176
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,64,2048,0.013431111143694984
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,64,512,0.0032257777121331957
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,64,1536,0.013071999781661563
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,64,256,0.0028764444092909494
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,64,1024,0.0120666664507654
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,64,128,0.002537777854336633
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,64,768,0.012060444388124677
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,64,64,0.002540444541308615
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,64,32,0.0026568888376156488
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,64,512,0.012436444560686747
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,64,256,0.011759999725553723
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,64,12288,0.009696889254781935
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,64,128,0.011045333411958484
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,32,65536,0.01515111161602868
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,64,64,0.011013333168294696
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,32,51200,0.013767110804716745
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,64,32,0.01144444445768992
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,32,16384,0.009318222602208456
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,32,12288,0.009869332942697737
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,32,10240,0.008987555901209513
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,32,65536,0.11072799894544814
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,32,51200,0.0865208903948466
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,32,16384,0.0328764451874627
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,32,12288,0.026769777139027912
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,32,8192,0.007620444728268518
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,32,7168,0.008986666798591614
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,32,6144,0.008348444269763099
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,32,10240,0.02404088940885332
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,32,5120,0.007416889071464539
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,32,4096,0.006928000185224745
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,32,8192,0.021485333641370136
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,32,7168,0.0195795562532213
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,32,3584,0.0069653333889113525
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,32,6144,0.018180444836616516
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,32,3072,0.006275555739800136
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,32,5120,0.017165333032608032
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,32,2560,0.005629333357016246
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,32,2048,0.004963555683692296
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,32,3584,0.014833778142929077
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,32,1536,0.004511111312442356
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,32,3072,0.014094221923086377
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,32,2560,0.014089778065681458
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,32,1024,0.0038577777643998465
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,32,768,0.003555555724435382
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,32,2048,0.013388444152143268
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,32,512,0.0031591111587153543
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,32,1536,0.012736000120639801
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,32,256,0.0028248888750871024
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,32,1024,0.012488000094890594
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,32,128,0.00254133323000537
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,32,512,0.012327999704413943
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,32,64,0.002826666666401757
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,32,128,0.011482666763994427
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,161,32,32,0.0028275555620590844
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,32,64,0.011412444214026133
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,32,32,0.011372444530328115
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,32,4096,0.015463110473420886
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,128,64,0.010688888529936472
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,32,768,0.012108444339699216
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,65536,16384,0.3504630989498562
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,161,32,256,0.011415111521879831
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,65536,51200,0.8965902328491211
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,65536,51200,1.0902320014105904
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,65536,16384,0.2968168788486057
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,65536,12288,0.2645680109659831
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,65536,10240,0.23530488544040254
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,65536,12288,0.21887466642591688
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,65536,10240,0.18570933077070448
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,65536,8192,0.19422133763631186
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,65536,8192,0.15285332997639975
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,65536,7168,0.16784444120195177
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,65536,7168,0.13150044282277426
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,65536,6144,0.1433253288269043
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,65536,6144,0.11436088879903157
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,65536,8192,0.167632884449429
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,65536,12288,0.2398888799879286
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,65536,10240,0.2020275592803955
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,65536,5120,0.12205955717298721
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,65536,16384,0.31806932555304634
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,65536,4096,0.10293333397971259
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,65536,7168,0.14897955788506403
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,65536,5120,0.09701510932710435
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,65536,3584,0.087391111585829
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,65536,4096,0.08093600140677558
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,65536,6144,0.13202755981021458
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,65536,3072,0.07640800211164686
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,65536,3584,0.07234578000174628
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,65536,5120,0.11396266354454888
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,65536,2560,0.06268178092108832
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,65536,3072,0.06412355767356025
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,65536,2560,0.05679644478691948
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,65536,4096,0.09807733032438491
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,65536,2048,0.05139822098943922
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,65536,3584,0.08864800135294597
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,65536,1536,0.03984266519546509
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,65536,3072,0.08160177866617839
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,65536,2048,0.04920088913705614
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,65536,1024,0.02985422147644891
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,65536,2560,0.07299644417232938
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,65536,1536,0.040720889965693154
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,65536,768,0.02247911029391819
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,65536,2048,0.06527200010087755
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,65536,512,0.016215999921162922
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,65536,1024,0.04855822192298042
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,65536,768,0.029208001163270738
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,65536,1536,0.05687555339601305
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,65536,768,0.046592000457975596
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,65536,1024,0.0335440006521013
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,65536,128,0.009311999711725447
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,65536,512,0.02507200009293026
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,65536,512,0.0410462220509847
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,65536,256,0.03503288825352987
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,65536,256,0.022597332795461018
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,65536,64,0.008316444853941599
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,65536,128,0.02145511077509986
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,65536,32,0.008354666332403818
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,65536,128,0.02971022327740987
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,65536,32,0.028436445527606543
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,65536,64,0.020928889513015747
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,65536,256,0.010327111515733931
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,51200,51200,0.718598206837972
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,51200,51200,0.9019795523749458
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,51200,65536,1.142883512708876
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,51200,65536,0.9251893361409506
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,51200,16384,0.28987110985649955
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,51200,12288,0.2238710986243354
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,51200,16384,0.23663910230000815
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,51200,12288,0.17627644538879395
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,51200,10240,0.16984711752997506
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,51200,10240,0.150163557794359
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,65536,51200,0.964729732937283
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,51200,8192,0.140721771452162
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,51200,8192,0.13685688707563612
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,51200,7168,0.12289510832892524
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,51200,7168,0.1094684468375312
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,51200,10240,0.17362756199306914
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,51200,12288,0.20440622170766196
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,51200,16384,0.26388711399502224
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,51200,8192,0.14453155464596218
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,51200,5120,0.09018577469719781
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,51200,6144,0.09376711315578884
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,51200,6144,0.1049191090795729
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,51200,4096,0.07550044192208184
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,51200,4096,0.06725688775380452
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,51200,7168,0.1292195585038927
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,51200,6144,0.11559555265638564
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,51200,5120,0.1001288890838623
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,51200,3584,0.06544622447755602
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,51200,3072,0.057651552889082164
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,51200,3584,0.060646222697363965
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,51200,4096,0.08672889073689778
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,51200,3072,0.05380710959434509
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,51200,2560,0.04893777767817179
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,51200,3584,0.07932977543936835
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,51200,3072,0.07322221994400024
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,51200,2048,0.04025333457522922
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,51200,2048,0.041682667202419706
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,51200,2560,0.04759644468625387
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,51200,2048,0.05944889121585422
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,51200,1536,0.03198933270242479
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,51200,1024,0.02442844377623664
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,51200,1536,0.03561866614553664
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,51200,5120,0.0804542236857944
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,51200,768,0.01817599932352702
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,51200,1536,0.05207111106978523
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,51200,512,0.013029333617952136
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,51200,1024,0.045026666588253446
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,51200,768,0.024215110474162634
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,51200,768,0.04049244523048401
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,51200,1024,0.02900444467862447
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,51200,256,0.009300444689061906
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,51200,128,0.0074337778819931885
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,51200,512,0.022276444567574397
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,51200,512,0.036664889918433294
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,51200,256,0.033352000845803156
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,51200,256,0.020241777102152508
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,51200,64,0.005903111149867375
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,51200,32,0.0059368887709246735
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,51200,128,0.02798488736152649
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,51200,128,0.018793778287039865
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,51200,64,0.018897778458065458
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,51200,32,0.01882844501071506
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,51200,51200,0.8330826759338379
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,16384,65536,0.3778284390767415
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,51200,2560,0.06662044260236952
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,16384,51200,0.29581067297193736
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,16384,51200,0.2888524532318115
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,16384,16384,0.0985048876868354
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,16384,65536,0.3661795457204183
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,16384,12288,0.07583644655015734
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,16384,16384,0.10036533408694798
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,16384,10240,0.06290666924582587
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,51200,65536,1.0604675081041124
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,16384,12288,0.07654222514894274
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,16384,10240,0.06715022193060981
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,16384,8192,0.05616622500949436
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,16384,8192,0.05736977524227566
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,16384,16384,0.11855555905236138
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,16384,7168,0.04945955673853556
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,16384,10240,0.08406133121914333
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,16384,6144,0.043226665920681424
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,16384,8192,0.07335288657082452
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,16384,7168,0.04849244488610161
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,16384,5120,0.034727109803093806
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,16384,6144,0.04355555441644457
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,16384,7168,0.06625511248906453
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,16384,4096,0.029157333903842505
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,16384,6144,0.06420799758699205
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,16384,5120,0.03813866774241129
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,16384,3584,0.0258942229880227
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,16384,4096,0.03343377841843499
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,16384,5120,0.05494222376081678
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,16384,4096,0.04880533284611172
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,16384,3072,0.023034666975339253
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,16384,3584,0.03013155526585049
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,16384,2560,0.01926933394538032
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,16384,3584,0.045604444212383695
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,16384,3072,0.02741866641574436
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,16384,3072,0.04361777835422092
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,16384,2560,0.024430221981472437
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,16384,2560,0.04008888867166307
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,16384,65536,0.4107040034400092
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,16384,1536,0.012978666358523898
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,16384,51200,0.32453687985738117
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,16384,2048,0.03755822115474277
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,16384,2048,0.02239822182390425
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,16384,1536,0.03418044580353631
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,16384,1024,0.010397333237859938
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,16384,12288,0.09433155589633518
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,16384,1536,0.020227554771635268
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,16384,1024,0.017667555146747164
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,16384,1024,0.031544887357287936
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,16384,768,0.031327111853493586
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,16384,256,0.0052062223354975385
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,16384,512,0.02782577938503689
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,16384,768,0.01683288812637329
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,16384,128,0.004226666771703296
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,16384,256,0.025019556283950806
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,16384,128,0.022630222969584998
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,16384,128,0.013433777623706393
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,16384,64,0.004015999949640698
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,16384,32,0.003955555458863576
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,16384,64,0.013454222016864352
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,16384,32,0.015857777661747403
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,16384,2048,0.016132444143295288
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,12288,65536,0.27608267466227215
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,16384,768,0.008608889248636033
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,12288,65536,0.28102045589023167
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,16384,512,0.007233777807818518
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,12288,51200,0.21594044897291395
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,12288,16384,0.07329689131842719
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,16384,512,0.015115555789735583
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,12288,51200,0.22415288289388022
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,12288,12288,0.05738311343722873
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,16384,256,0.014392889208263822
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,12288,10240,0.04742044541570875
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,12288,12288,0.06101422177420723
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,12288,16384,0.11724177996317546
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,12288,12288,0.09381244579950969
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,12288,10240,0.053716444306903414
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,12288,10240,0.0825128886434767
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,12288,8192,0.04685777756902906
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,12288,7168,0.03488533364401923
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,12288,8192,0.07255288627412584
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,12288,6144,0.03038755390379164
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,12288,7168,0.039113776551352605
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,12288,7168,0.06520977947447035
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,12288,65536,0.40129688051011825
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,12288,5120,0.026760889424218073
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,12288,51200,0.31636977195739746
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,12288,6144,0.03547822104560004
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,12288,6144,0.05999200211630928
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,12288,4096,0.022664000590642292
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,12288,5120,0.03154222170511881
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,12288,3584,0.01949155496226417
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,12288,5120,0.053611556688944496
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,12288,16384,0.07926222350862291
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,12288,4096,0.027095999982621934
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,12288,3072,0.017493334081437852
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,12288,2560,0.014519110321998596
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,12288,3584,0.024775111012988623
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,12288,3072,0.02296177711751726
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,12288,3072,0.04247466723124186
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,12288,2560,0.021310221817758348
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,12288,2048,0.012714666624863943
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,12288,2560,0.03946400019857619
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,12288,1536,0.010657777388890585
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,12288,1024,0.008639111287064022
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,12288,8192,0.04047377904256185
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,12288,2048,0.03744533326890733
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,12288,2048,0.019905777441130746
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,12288,768,0.0075911109646161394
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,12288,1536,0.01815111107296414
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,12288,512,0.005574222240183089
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,12288,1024,0.02881511052449544
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,12288,1024,0.015777778294351365
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,12288,256,0.004534222185611725
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,12288,768,0.029096000724368628
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,12288,768,0.014785778191354541
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,12288,512,0.026775999201668635
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,12288,128,0.003896000070704354
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,12288,512,0.014473777678277759
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,12288,64,0.0038862224254343244
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,12288,256,0.013447110851605734
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,12288,32,0.0041848888827694785
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,12288,128,0.013063111239009433
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,12288,64,0.013559111290507846
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,12288,32,0.01309866706530253
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,10240,65536,0.2468737761179606
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,12288,4096,0.04825599988301595
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,10240,65536,0.26785866419474286
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,10240,51200,0.19386755095587838
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,12288,3584,0.0453342232439253
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,10240,16384,0.06512000163396199
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,10240,51200,0.2113786670896742
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,12288,1536,0.034260445170932345
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,10240,16384,0.07630933655632867
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,10240,12288,0.05128444565667046
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,10240,12288,0.059471997949812144
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,12288,128,0.021653332644038733
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,10240,16384,0.11645421716901992
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,10240,10240,0.0428071121374766
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,10240,12288,0.09306489096747504
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,10240,8192,0.036539554595947266
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,10240,10240,0.052163554562462695
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,10240,7168,0.031926221317715116
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,10240,8192,0.04519822200139364
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,10240,10240,0.0823813345697191
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,10240,6144,0.027888000011444092
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,10240,8192,0.07202666335635714
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,10240,7168,0.037985778517193265
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,10240,7168,0.06455377737681071
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,10240,6144,0.034493333763546415
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,10240,51200,0.314976003434923
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,10240,4096,0.020792000823550753
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,10240,5120,0.03030222323205736
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,10240,5120,0.05294488867123922
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,10240,3584,0.018193778064515855
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,10240,4096,0.02604622145493825
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,10240,4096,0.04697155621316698
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,10240,3072,0.016043555405404832
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,10240,3584,0.044192890326182045
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,12288,256,0.025011556016074285
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,10240,3072,0.02257599929968516
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,10240,2560,0.014176888598336114
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,10240,2560,0.02087644404835171
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,10240,2560,0.039353777964909874
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,10240,2048,0.0120328888297081
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,10240,2048,0.03657333387268914
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,10240,2048,0.01919911139541202
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,10240,1536,0.010024888647927178
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,10240,65536,0.39759378963046604
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,10240,1024,0.008656000097592672
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,10240,5120,0.024307555622524683
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,10240,1536,0.017500445246696472
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,10240,768,0.00655644428398874
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,10240,6144,0.05985244115193685
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,10240,1024,0.030031998952229817
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,10240,1024,0.015215999550289579
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,10240,512,0.005570666657553778
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,10240,768,0.028038223584493
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,10240,768,0.014745778507656522
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,10240,512,0.013759999639458127
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,10240,256,0.004534222185611725
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,10240,128,0.003909333298603694
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,10240,256,0.024380443824662104
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,10240,256,0.013405332962671915
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,10240,128,0.012814222110642327
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,10240,64,0.003565333369705412
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,10240,32,0.0038311113086011675
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,10240,128,0.02142488956451416
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,10240,3072,0.04204444421662224
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,10240,64,0.013120888835854001
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,10240,32,0.013298666311634911
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,8192,65536,0.1873413324356079
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,8192,51200,0.142758223745558
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,8192,65536,0.22501420974731445
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,8192,16384,0.04925688770082262
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,8192,51200,0.1793351173400879
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,10240,1536,0.033653332127465144
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,8192,12288,0.03856089048915439
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,8192,16384,0.06567466921276517
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,10240,512,0.026446221603287592
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,8192,16384,0.08464622497558594
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,8192,10240,0.03228800164328681
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,8192,12288,0.06868000162972344
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,10240,3584,0.024453333682484094
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,8192,8192,0.028190222051408555
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,8192,10240,0.045365333557128906
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,8192,10240,0.06186311112509834
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,8192,8192,0.038853334056006536
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,8192,65536,0.2621973355611165
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,8192,51200,0.21097777949439156
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,8192,6144,0.021545777718226116
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,8192,7168,0.03314310974544949
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,8192,7168,0.04926044411129422
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,8192,5120,0.01850044396188524
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,8192,6144,0.029888888200124104
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,8192,4096,0.015999111864301894
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,8192,6144,0.04628888765970866
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,8192,5120,0.04186311033036974
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,8192,5120,0.02646844420168135
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,8192,3584,0.013752000199423896
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,8192,4096,0.03867377837498983
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,8192,4096,0.023197333017985027
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,8192,3072,0.012375999655988483
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,8192,3584,0.022072000635994807
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,8192,3584,0.03661777906947666
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,8192,2560,0.010759111079904767
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,8192,2048,0.009676444033781687
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,8192,3072,0.035608887672424316
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,8192,3072,0.020629333125220407
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,8192,2560,0.019440889358520508
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,8192,2560,0.033759110503726535
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,8192,1536,0.00814844419558843
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,8192,12288,0.05156711075041029
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,8192,1024,0.006607111129495833
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,8192,2048,0.017853332890404593
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,8192,2048,0.03230399886767069
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,8192,768,0.0052435555391841466
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,8192,1536,0.027973333994547527
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,8192,1024,0.026159110996458266
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,8192,1024,0.01443377799457974
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,8192,512,0.004229333251714706
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,8192,768,0.025356445047590468
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,8192,7168,0.024355555574099224
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,8192,768,0.014091556270917257
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,8192,256,0.003571555432346132
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,8192,128,0.0035128887328836652
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,8192,8192,0.054027554061677724
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,8192,512,0.013411555853154926
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,8192,512,0.025398222936524287
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,8192,256,0.02336888843112522
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,8192,256,0.0127697777416971
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,8192,32,0.00351555562681622
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,8192,128,0.020248000820477802
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,8192,128,0.012226666841242047
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,8192,64,0.012739555703269111
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,8192,32,0.0124195557501581
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,7168,65536,0.1671911080678304
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,7168,51200,0.12999199496375188
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,7168,65536,0.22051110532548693
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,7168,16384,0.04567911227544149
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,7168,51200,0.17505155669318306
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,7168,16384,0.06436266501744588
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,7168,12288,0.036567111810048424
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,7168,16384,0.08302666743596394
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,7168,12288,0.050563553969065346
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,8192,1536,0.016528889536857605
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,7168,10240,0.030552887254291113
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,7168,12288,0.06770755847295125
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,7168,8192,0.025681777132882014
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,7168,51200,0.207367115550571
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,7168,10240,0.04400711258252462
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,7168,8192,0.037625776396857366
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,7168,10240,0.06114221943749321
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,7168,65536,0.2580711046854655
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,8192,64,0.0031644445326593188
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,7168,6144,0.019674667053752475
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,7168,8192,0.05407911207940844
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,7168,7168,0.02267733381854163
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,7168,5120,0.016960889101028442
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,7168,7168,0.03195200032658047
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,7168,4096,0.015071999695565967
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,7168,7168,0.04833244283994039
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,7168,6144,0.029447111818525527
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,7168,6144,0.045143110884560474
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,7168,5120,0.025976000560654536
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,7168,5120,0.04082577758365207
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,7168,3072,0.012031111452314587
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,7168,4096,0.02307022280163235
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,7168,3584,0.02176800039079454
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,7168,3584,0.03570400012864007
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,7168,3072,0.020555555820465088
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,7168,3072,0.03503111004829407
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,7168,2048,0.009209777745935652
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,7168,2560,0.033442666133244835
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,7168,2560,0.019112888309690688
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,7168,1536,0.007696888513035244
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,7168,2048,0.01795111099878947
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,7168,2048,0.03195733494228787
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,7168,1024,0.005912000106440649
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,7168,1536,0.015473778049151102
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,7168,768,0.005156444592608346
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,7168,1024,0.02593333356910282
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,7168,768,0.013907555076811047
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,7168,768,0.025408888856569927
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,7168,512,0.004221333397759331
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,7168,512,0.02461066676510705
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,7168,512,0.013403555585278405
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,7168,256,0.0038648889296584656
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,7168,256,0.02292799949645996
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,7168,256,0.01277599980433782
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,7168,3584,0.01310488912794325
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,7168,4096,0.03840533230039809
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,7168,64,0.0031928889867332247
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,7168,128,0.020280889338917203
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,7168,32,0.0035013332962989807
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,7168,64,0.01277511070171992
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,7168,32,0.012068444656001197
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,6144,65536,0.15221956041124132
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,7168,1536,0.027796443965699937
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,6144,51200,0.12255999777052139
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,7168,1024,0.014455111490355598
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,6144,65536,0.18322400252024332
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,6144,16384,0.04228711128234863
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,6144,51200,0.14621155791812473
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,6144,16384,0.05470755696296692
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,6144,12288,0.0335457788573371
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,6144,16384,0.07855821980370416
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,6144,12288,0.043459554513295494
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,6144,12288,0.0654933320151435
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,6144,10240,0.028213332096735638
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,7168,128,0.0034959999223550162
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,6144,8192,0.02442933287885454
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,6144,65536,0.2435671223534478
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,6144,10240,0.03738488753636678
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,7168,2560,0.010307555397351583
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,6144,10240,0.05870755513509115
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,6144,7168,0.0210826661851671
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,6144,6144,0.01867022282547421
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,6144,8192,0.03161333335770501
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,6144,8192,0.052258667018678456
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,6144,7168,0.027229333917299908
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,6144,5120,0.0158942225906584
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,6144,7168,0.046930667426851064
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,6144,4096,0.013827555709415011
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,6144,6144,0.044234666559431285
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,6144,5120,0.022944000032213
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,6144,3584,0.0123857781291008
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,6144,4096,0.03716889023780823
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,6144,4096,0.020984888076782227
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,6144,3072,0.011412444214026133
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,6144,3584,0.035375111632876925
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,6144,3584,0.019710222880045574
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,6144,2560,0.011351111034552256
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,6144,3072,0.01887822151184082
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,6144,3072,0.03431111243036058
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,6144,2048,0.010023111270533668
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,6144,2560,0.017222222354676988
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,6144,2560,0.03266755408710904
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,6144,1536,0.0083155557513237
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,6144,2048,0.016490666402710807
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,6144,2048,0.030827555391523574
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,6144,1024,0.0069448889957533936
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,6144,1536,0.014846222268210517
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,6144,1536,0.027481777800454035
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,7168,128,0.012406222522258759
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,6144,768,0.0052328887912962176
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,6144,1024,0.013753777576817406
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,6144,1024,0.026438222991095647
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,6144,512,0.004856889032655292
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,6144,768,0.024710221423043147
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,6144,768,0.013412444127930535
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,6144,256,0.0038373333712418876
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,6144,512,0.024659555819299486
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,6144,6144,0.024958221448792353
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,6144,128,0.003530666646030214
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,6144,256,0.012451555165979596
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,6144,5120,0.03973333372010125
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,6144,128,0.02000177734427982
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,6144,128,0.012060444388124677
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,6144,32,0.00351555562681622
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,6144,64,0.011768889096048145
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,6144,32,0.011765333513418833
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,5120,65536,0.140775998433431
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,5120,51200,0.1127013365427653
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,5120,65536,0.1797004408306546
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,5120,51200,0.1401617791917589
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,5120,16384,0.04576889011594984
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,5120,16384,0.05304444498485989
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,6144,512,0.013148444394270578
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,5120,12288,0.035240888595581055
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,5120,51200,0.19320978058709037
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,6144,256,0.022653333014912073
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,5120,10240,0.0302782224284278
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,5120,16384,0.07840800285339355
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,5120,12288,0.041803555356131665
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,5120,12288,0.06464178032345243
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,5120,8192,0.025495999389224585
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,5120,10240,0.034796443250444196
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,5120,7168,0.022660444180170696
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,5120,10240,0.05771555503209432
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,5120,8192,0.03090488910675049
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,5120,8192,0.05178222060203552
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,5120,6144,0.019578667150603402
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,5120,7168,0.026965333355797663
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,5120,7168,0.04674222071965536
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,5120,5120,0.016812443733215332
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,5120,6144,0.024850666522979736
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,5120,6144,0.04328711165322197
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,5120,4096,0.014115555418862237
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,5120,5120,0.02260533306333754
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,5120,5120,0.03945777813593546
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,5120,3584,0.01311911145846049
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,5120,4096,0.03710577885309855
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,6144,51200,0.19533067279391816
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,5120,3072,0.011375111010339526
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,5120,3584,0.019564444820086162
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,5120,3584,0.034797334008746676
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,5120,2560,0.00998222248421775
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,5120,3072,0.034188446071412824
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,5120,65536,0.24244621064927843
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,5120,3072,0.018194667167133756
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,5120,2048,0.008636444807052612
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,5120,2560,0.01692800058258904
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,5120,2560,0.03173333406448364
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,5120,1536,0.007613333563009898
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,5120,1024,0.005913777897755305
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,5120,2048,0.02844088938501146
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,6144,64,0.0031724443866146933
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,5120,1536,0.026426666312747534
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,5120,1536,0.014152889450391134
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,5120,768,0.004872000051869286
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,5120,1024,0.013771555489963956
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,5120,512,0.004221333397759331
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,5120,1024,0.025407999753952026
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,5120,768,0.0243493335114585
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,5120,768,0.013066666821638743
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,5120,256,0.0038977778620190094
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,5120,512,0.02502044373088413
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,5120,256,0.012172444827026792
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,5120,128,0.003547555456558863
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,5120,256,0.022287999590237934
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,5120,64,0.0031866667171319327
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,5120,128,0.020939555433061387
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,5120,128,0.011743110915025076
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,5120,32,0.0031928889867332247
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,5120,64,0.012044444680213928
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,5120,32,0.012039110892348819
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,4096,65536,0.09911555714077419
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,5120,4096,0.020558221472634208
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,4096,51200,0.07995111412472196
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,4096,65536,0.17184621757931182
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,4096,16384,0.034520887666278414
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,4096,51200,0.13731555143992105
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,5120,2048,0.015127110812399121
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,4096,16384,0.050889776812659375
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,4096,12288,0.02716444432735443
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,4096,16384,0.07793866925769381
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,4096,10240,0.019976889093716938
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,4096,65536,0.23908445570203993
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,4096,12288,0.06385066774156359
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,5120,512,0.01309333327743742
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,4096,51200,0.1925742228825887
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,4096,10240,0.033969776497946844
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,4096,7168,0.015034667319721647
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,4096,10240,0.05720800161361694
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,4096,8192,0.030064000023735896
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,4096,7168,0.0461768905321757
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,4096,7168,0.026367111338509455
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,4096,5120,0.011733333269755045
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,4096,6144,0.024339555038346186
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,4096,6144,0.0435697767469618
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,4096,4096,0.01033688916100396
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,4096,5120,0.022226666410764057
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,4096,5120,0.03927910990185208
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,4096,3584,0.009341333475377824
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,4096,4096,0.036151111125946045
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,4096,4096,0.020304888486862183
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,4096,3072,0.00832266691658232
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,4096,3584,0.018969777557584975
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,4096,3584,0.034112887250052557
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,4096,2560,0.007616889145639207
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,4096,3072,0.017456889152526855
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,4096,3072,0.031911111540264554
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,4096,2048,0.006576889091067844
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,4096,2560,0.01651022169325087
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,4096,2560,0.03047555685043335
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,4096,12288,0.039048890272776283
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,4096,1536,0.005597333527273602
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,4096,2048,0.01511111193233066
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,4096,8192,0.017248888810475666
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,4096,1024,0.004524444540341695
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,4096,2048,0.02811466654141744
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,4096,768,0.0041235557032956015
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,4096,1536,0.027080888549486797
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,4096,1536,0.014103111293580798
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,4096,1024,0.025056888659795124
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,4096,6144,0.013579555683665805
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,4096,1024,0.013418667018413544
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,4096,256,0.0032275555034478507
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,4096,768,0.02466933263672723
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,4096,512,0.01274577776590983
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,4096,512,0.024433778391944036
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,4096,256,0.012085333466529846
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,4096,256,0.023018666439586218
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,4096,64,0.003175111073586676
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,4096,128,0.011904000408119626
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,4096,128,0.019738665885395475
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,4096,32,0.0028515555378463534
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,4096,64,0.012368888490729861
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,3584,65536,0.09266577826605903
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,4096,32,0.011716444459226398
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,3584,51200,0.07426133420732287
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,3584,65536,0.16899732748667398
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,3584,51200,0.13531733883751765
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,3584,16384,0.030864887767367895
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,4096,512,0.003552888830502828
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,4096,8192,0.05098399851057264
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,3584,65536,0.23753600650363496
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,3584,16384,0.0488373339176178
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,3584,12288,0.025378665990299646
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,3584,10240,0.021980444590250652
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,3584,51200,0.19123466809590658
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,3584,16384,0.07807022333145142
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,3584,12288,0.038444442881478205
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,4096,128,0.003220444545149803
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,3584,8192,0.01613333324591319
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,3584,7168,0.014838222000333997
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,3584,10240,0.033899555603663124
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,3584,10240,0.056886222627427846
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,3584,8192,0.05074844426578946
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,3584,8192,0.029870222012201946
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,3584,6144,0.013082666529549493
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,3584,7168,0.026194666822751362
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,3584,7168,0.04605422086185879
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,3584,5120,0.011384888655609555
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,3584,6144,0.042986667818493314
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,3584,4096,0.01204355557759603
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,3584,5120,0.021941334009170532
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,3584,5120,0.039373334911134504
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,3584,3584,0.010747555229398938
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,3584,4096,0.019904888338512845
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,3584,3584,0.018248000078731112
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,3584,3584,0.03438577718204922
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,3584,3072,0.00831733312871721
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,3584,2560,0.007546666595670912
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,3584,3072,0.03391644358634949
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,3584,3072,0.01716800034046173
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,4096,768,0.013108444710572561
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,3584,2048,0.006562666760550604
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,3584,2560,0.015592889653311836
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,3584,2560,0.030187557140986126
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,3584,1536,0.0052675555149714155
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,3584,2048,0.01480888823668162
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,3584,12288,0.06306044260660808
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,3584,1024,0.00452888881166776
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,3584,1536,0.014465777410401238
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,3584,1536,0.025846223036448162
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,3584,768,0.0038782221575578055
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,3584,1024,0.024193776978386775
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,3584,1024,0.013423110875818463
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,3584,512,0.003714666598372989
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,3584,768,0.012774222426944308
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,3584,768,0.025759999950726826
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,3584,256,0.003216888962520493
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,3584,512,0.012676444318559436
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,3584,512,0.02365422248840332
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,3584,6144,0.024107555548350017
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,3584,128,0.0032257777121331957
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,3584,64,0.003162666741344664
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,3584,256,0.012424888710180918
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,3584,128,0.020615999897321064
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,3584,32,0.0031928889867332247
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,3584,4096,0.036729776197009616
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,3584,64,0.011711999773979187
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,3072,65536,0.07929778099060059
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,3584,32,0.012079999678664737
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,3072,51200,0.06261599726147123
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,3072,65536,0.1278195513619317
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,3072,51200,0.10527910788853963
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,3072,16384,0.026774222652117412
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,3584,2048,0.02810133496920268
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,3072,16384,0.07750933037863837
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,3072,65536,0.23775643772549102
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,3072,12288,0.02295733326011234
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,3072,51200,0.19044710530175102
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,3072,10240,0.02271822260485755
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,3072,12288,0.06288266844219632
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,3072,12288,0.030478222502602473
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,3072,8192,0.018567999203999836
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,3072,10240,0.05670844184027778
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,3072,7168,0.01717066599263085
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,3072,8192,0.025115556187099878
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,3072,8192,0.05044622222582499
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,3584,256,0.021937777598698933
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,3072,7168,0.022125333547592163
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,3584,128,0.011760888828171624
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,3072,5120,0.013391111459996967
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,3072,7168,0.04590222239494324
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,3072,6144,0.020344000723626878
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,3072,6144,0.043248001072141856
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,3072,4096,0.011694221860832639
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,3072,5120,0.03963288995954726
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,3072,3584,0.010657777388890585
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,3072,4096,0.017112000121010672
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,3072,4096,0.03598577777544657
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,3072,3072,0.009319110876984065
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,3072,3584,0.016131555040677387
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,3072,3584,0.03347288899951511
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,3072,2560,0.008616888688670265
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,3072,3072,0.015061333775520325
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,3072,3072,0.03160444564289517
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,3072,2048,0.007265778051482306
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,3072,2560,0.0144195556640625
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,3072,2560,0.029785778787400987
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,3072,1536,0.0058782220714622075
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,3072,2048,0.013853333062595792
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,3072,2048,0.02883466747072008
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,3072,10240,0.027797334724002417
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,3072,1024,0.004869333157936732
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,3072,1536,0.013375110924243927
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,3072,1536,0.026774222652117412
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,3072,768,0.004528000122971005
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,3072,1024,0.024671110841963027
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,3072,1024,0.013095999757448832
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,3072,512,0.003568888952334722
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,3072,6144,0.015433778365453085
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,3072,768,0.023659555448426142
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,3072,256,0.0035182221068276297
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,3072,768,0.01254666679435306
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,3072,128,0.0032008888406885993
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,3072,512,0.024273778001467388
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,3072,512,0.012608889076444836
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,3072,64,0.003023111157947116
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,3072,256,0.022309333086013794
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,3072,32,0.0031724443866146933
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,3072,128,0.020232000284724765
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,2560,65536,0.06879555516772799
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,3072,64,0.012107555237081317
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,3072,32,0.011381333072980246
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,2560,51200,0.055288000239266284
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,2560,65536,0.12776354948679605
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,3072,16384,0.039517333110173546
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,2560,16384,0.023352000448438857
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,2560,51200,0.10190577639473809
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,2560,65536,0.23736710018581816
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,2560,12288,0.019924443629052904
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,2560,16384,0.07669599850972493
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,2560,51200,0.1904391050338745
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,2560,10240,0.017676444517241586
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,2560,12288,0.030617776844236586
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,2560,12288,0.06266311142179701
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,2560,8192,0.016918222109476726
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,2560,10240,0.02745955520206028
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,2560,10240,0.055995557043287486
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,2560,7168,0.016367110941145156
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,3072,256,0.011773332953453064
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,2560,8192,0.024775111012988623
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,3072,5120,0.019136889113320243
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,2560,6144,0.013917333549923368
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,2560,8192,0.05026577909787496
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,2560,5120,0.011587555209795633
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,2560,7168,0.02197866638501485
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,2560,6144,0.0421999990940094
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,2560,6144,0.02034133341577318
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,2560,4096,0.01070577816830741
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,2560,5120,0.018651554981867473
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,2560,5120,0.03749777873357137
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,2560,3584,0.009298666483826106
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,2560,4096,0.016252444850073922
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,2560,4096,0.03399466805987888
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,2560,3072,0.008952889177534316
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,2560,3584,0.032241778241263494
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,2560,3584,0.01579466627703773
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,2560,2560,0.007600000335110559
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,2560,3072,0.014781332678265043
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,2560,3072,0.031202667289310034
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,2560,2048,0.006804444309737947
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,2560,2560,0.014128888646761576
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,2560,2560,0.029905776182810467
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,2560,16384,0.037782222032547
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,2560,1536,0.005574222240183089
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,2560,2048,0.02780888809098138
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,2560,1024,0.004563555535342959
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,2560,1536,0.013079110946920184
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,2560,1536,0.026378666361172993
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,2560,768,0.0041759999261962045
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,2560,1024,0.02574666672282749
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,2560,1024,0.012730666332774691
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,2560,512,0.003531555748648114
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,2560,768,0.023984000086784363
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,2560,512,0.012331555287043253
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,3072,128,0.011729777687125735
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,2560,256,0.011712888876597086
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,2560,7168,0.04584088921546936
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,2560,128,0.003228444399105178
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,2560,256,0.02275111112329695
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,2560,64,0.0031617778456873367
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,2560,128,0.01922044489118788
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,2560,32,0.003173333282272021
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,2560,64,0.011767999993430244
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,2560,32,0.011362666885058085
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,2048,65536,0.05530844463242424
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,2560,2048,0.013785777820481194
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,2048,65536,0.12473244137234157
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,2048,51200,0.04387377699216207
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,2048,16384,0.019879110985332064
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,2048,51200,0.10024355517493354
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,2560,768,0.012456888953844706
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,2048,12288,0.0166275550921758
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,2048,16384,0.07654222514894274
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,2048,51200,0.1894071102142334
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,2048,12288,0.029807110627492268
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,2048,12288,0.06220177809397379
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,2048,10240,0.02699111070897844
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,2560,128,0.011364444262451597
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,2048,10240,0.05613778034845988
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,2048,8192,0.024375110864639282
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,2048,8192,0.05009599857860141
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,2048,7168,0.013573333621025085
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,2048,7168,0.0455022222465939
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,2048,7168,0.02091288897726271
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,2048,6144,0.012720888687504662
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,2048,6144,0.01955200069480472
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,2048,6144,0.04225688841607836
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,2048,5120,0.010430222584141625
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,2048,65536,0.2362142139010959
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,2048,4096,0.009053332938088311
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,2560,256,0.0035031110876136353
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,2048,5120,0.018236445056067575
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,2048,4096,0.03525688913133409
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,2048,4096,0.016220443778567843
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,2048,3584,0.008282666405042013
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,2048,3584,0.01517511076397366
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,2048,3072,0.007983999947706858
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,2048,8192,0.014694222145610385
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,2048,3072,0.01460977726512485
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,2048,3072,0.03088266650835673
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,2048,2560,0.006853333363930385
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,2048,2560,0.014144000079896716
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,2048,2560,0.029130667448043823
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,2048,2048,0.005538666827811136
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,2048,2048,0.013471999930010902
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,2048,2048,0.02842666705449422
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,2048,1536,0.004877333425813251
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,2048,1536,0.013095999757448832
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,2560,512,0.024375999967257183
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,2048,1024,0.004231111043029361
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,2048,1024,0.0247013337082333
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,2048,1024,0.012776888906955719
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,2048,10240,0.015839111473825242
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,2048,768,0.0041706665522522396
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,2048,512,0.0034844444857703317
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,2048,768,0.023361777265866596
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,2048,3584,0.03207022282812331
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,2048,256,0.003160888950030009
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,2048,512,0.012372444073359171
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,2048,512,0.023324444890022278
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,2048,128,0.003148444410827425
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,2048,256,0.02281155520015293
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,2048,256,0.011761777930789523
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,2048,64,0.0028248888750871024
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,2048,128,0.011412444214026133
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,2048,128,0.020289777053727042
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,2048,32,0.0028231110837724474
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,2048,64,0.011420444481902652
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,1536,65536,0.04532355401251051
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,2048,32,0.011762667033407422
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,1536,51200,0.0362044440375434
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,1536,65536,0.11904356214735244
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,2048,1536,0.025757332642873127
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,2048,16384,0.036679999695883855
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,1536,16384,0.01663733356528812
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,1536,51200,0.09808266825146145
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,1536,65536,0.23477511935763887
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,1536,12288,0.014096889230940076
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,1536,16384,0.03587199913130866
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,1536,16384,0.07622222105662028
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,1536,51200,0.18774755795796713
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,1536,10240,0.015096000499195524
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,1536,12288,0.02920177910063002
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,1536,8192,0.014928888943460254
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,2048,768,0.012479110724396177
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,1536,10240,0.055776887469821505
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,1536,7168,0.012464000119103326
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,1536,8192,0.04934933450486925
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,1536,8192,0.02348533272743225
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,1536,6144,0.011327111058764987
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,1536,7168,0.04337066743108961
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,1536,7168,0.02079288827048408
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,1536,5120,0.009763555394278632
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,1536,6144,0.01832266648610433
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,1536,6144,0.04207999838723076
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,1536,4096,0.008667555948098501
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,1536,5120,0.01752088963985443
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,1536,5120,0.03683822353680929
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,1536,3584,0.00794488853878445
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,1536,4096,0.01643111142847273
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,1536,4096,0.033598221010631986
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,1536,3072,0.0069724445541699724
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,1536,3584,0.03155555658870273
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,1536,3584,0.015383111106024848
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,1536,2560,0.006265777680608962
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,1536,3072,0.014519110321998596
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,1536,3072,0.030821333328882854
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,1536,2048,0.0052577778697013855
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,1536,2560,0.014122666584120857
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,2048,5120,0.037026666932635836
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,1536,1536,0.004910222358173794
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,1536,2048,0.013419555293189155
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,1536,1024,0.0041982221106688184
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,1536,1536,0.013071999781661563
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,1536,1024,0.012437333663304647
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,1536,768,0.0038559999730851916
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,1536,1024,0.024732444021436904
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,1536,10240,0.02662311163213518
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,1536,512,0.0035617777870761026
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,1536,768,0.024687111377716064
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,1536,768,0.012367111113336353
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,1536,256,0.0031999999450312722
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,1536,512,0.02296888828277588
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,1536,512,0.01204177737236023
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,1536,128,0.0029475556479560006
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,1536,256,0.011745777395036487
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,1536,256,0.022336888644430373
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,1536,64,0.0028168888141711554
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,1536,128,0.019595555133289762
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,1536,128,0.011064888702498542
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,1536,32,0.002871111035346985
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,1536,64,0.01127644462717904
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,1536,32,0.011417778001891242
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,1024,65536,0.033824000093672014
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,1536,2560,0.028929776615566675
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,1024,51200,0.027095110880004034
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,1024,65536,0.11877244048648411
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,1536,1536,0.027090667022599116
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,1024,16384,0.013445333474212222
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,1024,65536,0.23505422804090711
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,1536,12288,0.06211555666393704
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,1024,51200,0.09377777576446533
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,1024,12288,0.014917333920796713
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,1024,51200,0.18831200069851348
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,1024,16384,0.03547733359866672
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,1024,12288,0.028660443094041612
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,1024,10240,0.01349244432316886
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,1024,12288,0.06167822413974338
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,1024,8192,0.012132444315486483
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,1024,10240,0.05509777863820394
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,1024,10240,0.025693333811230127
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,1024,7168,0.011695110963450538
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,1024,8192,0.047641777329974704
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,1024,6144,0.010699555277824402
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,1024,7168,0.019926221834288705
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,1024,7168,0.04334933227962918
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,1024,5120,0.009323555562231276
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,1024,6144,0.01850488947497474
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,1024,6144,0.040651556518342756
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,1024,4096,0.008205333517657386
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,1024,5120,0.017151999804708693
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,1024,5120,0.03674044542842441
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,1024,3584,0.011408000356621213
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,1024,4096,0.03313333458370633
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,1024,4096,0.015875554747051664
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,1024,3072,0.010326222413116032
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,1024,3584,0.015205333630243937
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,1536,2048,0.027739556299315557
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,1024,2560,0.008671999805503422
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,1024,3072,0.030517333083682593
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,1024,3072,0.014560888210932413
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,1024,2048,0.007916444705592262
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,1024,2560,0.013778666655222574
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,1024,1536,0.004889777965015835
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,1024,2048,0.027464888162083093
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,1024,16384,0.07555822531382243
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,1024,1536,0.012808000048001608
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,1024,1024,0.004309333446953031
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,1024,1024,0.024678222007221643
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,1024,1024,0.012432888978057437
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,1024,768,0.003909333298603694
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,1024,768,0.024689777029885188
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,1024,768,0.012048888537618848
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,1024,512,0.0035075553589397003
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,1024,512,0.011895111037625207
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,1024,256,0.00318755561278926
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,1024,3584,0.03155733479393853
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,1024,256,0.011728888584507836
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,1024,128,0.002951111023624738
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,1024,256,0.02196088929971059
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,1024,2560,0.02954044606950548
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,1024,2048,0.013463111387358772
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,1024,64,0.0029208889851967492
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,1024,128,0.01959911154376136
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,1024,32,0.0028888889484935333
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,768,65536,0.025952888859642878
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,1024,1536,0.025752888785468206
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,1024,64,0.011778666741318174
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,1024,32,0.011380444798204633
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,768,51200,0.022708444131745234
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,768,65536,0.11699199676513672
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,1024,8192,0.022069333328141108
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,768,16384,0.014575999644067554
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,768,51200,0.09235466851128472
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,768,12288,0.012498666842778524
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,768,65536,0.23494132359822592
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,768,51200,0.18911733892228869
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,768,10240,0.01277511070171992
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,768,16384,0.03517599900563558
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,768,16384,0.07563733392291598
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,768,8192,0.011333333121405708
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,768,12288,0.02792000108295017
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,768,12288,0.06138755877812704
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,768,7168,0.010877333581447601
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,768,10240,0.024756444825066462
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,768,10240,0.055148445897632174
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,768,6144,0.009702222214804756
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,768,8192,0.04725955592261421
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,768,7168,0.019832000136375427
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,768,5120,0.00941422250535753
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,768,6144,0.04009066687689887
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,768,5120,0.03611200054486593
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,1024,128,0.011379555695586734
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,768,4096,0.008003555238246918
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,768,4096,0.033260444800059
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,768,4096,0.01579466627703773
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,768,3584,0.007630222373538547
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,768,3584,0.01515111161602868
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,768,3584,0.03177777926127116
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,768,3072,0.0062773335311147906
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,768,3072,0.014448000325096978
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,768,3072,0.03048000070783827
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,1024,512,0.02285066743691762
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,768,2560,0.005619555711746216
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,768,8192,0.02276800076166789
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,768,2048,0.0053688887920644544
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,768,2560,0.02913155489497715
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,768,2560,0.013797333670987023
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,768,1536,0.004854222138722737
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,768,6144,0.018547554810841877
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,768,2048,0.027489778068330552
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,768,1024,0.004192000048028098
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,768,1536,0.012784889174832238
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,768,5120,0.017204445269372728
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,768,1536,0.026347556047969397
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,768,768,0.0038613333470291565
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,768,512,0.0032311110860771606
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,768,1024,0.012435555458068848
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,768,768,0.024342222346199885
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,768,768,0.012104888757069906
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,768,256,0.0031991110493739447
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,768,512,0.01183199965291553
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,768,512,0.023021333747439917
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,768,128,0.0028408887899584244
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,768,256,0.011706666813956367
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,768,256,0.022674666510687932
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,768,64,0.0027822222974565295
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,768,32,0.002801777794957161
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,768,128,0.01146755533085929
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,512,65536,0.028304888142479792
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,768,64,0.011696889168686338
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,768,32,0.011347555451922946
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,512,51200,0.023971555961502924
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,512,65536,0.11554577615525986
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,512,65536,0.23516533109876844
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,512,51200,0.09175022443135579
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,512,16384,0.016531555189026725
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,512,51200,0.1881413327323066
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,768,2048,0.013569778038395775
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,512,12288,0.01165244479974111
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,512,16384,0.03425866696569655
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,512,10240,0.01037333326207267
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,512,12288,0.060771558019849986
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,512,12288,0.02776622275511424
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,768,1024,0.024060444699393377
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,512,8192,0.009287999735938178
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,512,10240,0.05442400111092461
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,512,7168,0.008298666940795051
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,512,8192,0.04682577649752299
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,512,8192,0.021781333618693884
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,512,6144,0.008316444853941599
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,768,128,0.019555555449591745
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,512,7168,0.042944888273874916
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,512,5120,0.007658667034573025
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,512,6144,0.01852799952030182
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,512,6144,0.039919111463758684
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,512,4096,0.007655999726719326
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,512,5120,0.03599822190072801
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,512,5120,0.017200888858901132
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,512,3584,0.007636444436179266
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,512,4096,0.015807110402319167
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,512,4096,0.032905777295430504
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,512,3072,0.006576889091067844
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,512,3584,0.015154666370815702
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,768,7168,0.04305511050754123
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,512,2560,0.005953777581453323
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,512,3072,0.014461333552996317
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,512,3072,0.03089244498146905
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,512,16384,0.0748622218767802
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,512,2048,0.005221333354711533
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,512,2560,0.014099554883109199
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,512,1536,0.00452888881166776
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,512,2048,0.02814399864938524
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,512,2048,0.013408000270525614
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,512,10240,0.024312888582547505
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,512,1024,0.0038782221575578055
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,512,1536,0.013101333545313941
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,512,768,0.0035439998739295532
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,512,1024,0.024716445141368445
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,512,768,0.012119111087587146
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,512,7168,0.0195795562532213
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,512,768,0.02438933319515652
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,512,512,0.0032319999817344877
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,512,256,0.003167111012670729
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,512,512,0.024106666445732117
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,512,512,0.011925333076053195
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,512,256,0.011763555308183035
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,512,256,0.02267733381854163
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,512,128,0.01164533363448249
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,512,128,0.020234665936893888
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,512,3584,0.031340443425708346
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,512,32,0.002833777831660377
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,512,64,0.011695110963450538
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,256,65536,0.01924533314175076
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,512,32,0.011071110765139261
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,512,2560,0.028720001379648846
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,256,51200,0.016187555260128446
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,256,65536,0.11389777395460342
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,512,1536,0.027104000250498455
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,256,51200,0.08904533253775702
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,512,1024,0.012411555482281579
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,256,51200,0.18853155771891275
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,256,16384,0.03286222285694546
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,256,12288,0.008990222381220924
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,256,16384,0.07401600148942736
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,512,128,0.0028862222615215513
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,256,10240,0.012440000143316058
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,256,12288,0.027048889133665297
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,256,8192,0.010990222295125326
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,256,12288,0.05924089087380303
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,256,10240,0.05271288752555847
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,512,64,0.002487999904486868
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,256,10240,0.02405511173937056
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,256,7168,0.010416888528399997
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,256,8192,0.02160800000031789
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,256,8192,0.04685866501596239
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,256,7168,0.04277333286073473
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,256,7168,0.019811555743217468
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,256,5120,0.00811822215716044
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,256,6144,0.040143112341562905
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,256,6144,0.01824711097611321
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,256,4096,0.007650666766696506
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,256,5120,0.017179555363125272
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,256,5120,0.035946667194366455
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,256,3584,0.007263999846246507
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,256,4096,0.015513777732849121
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,256,4096,0.033040000332726374
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,256,3072,0.007234666910436418
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,256,3584,0.014767110347747803
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,256,3584,0.032227555910746254
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,256,16384,0.009679111341635386
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,256,2560,0.0058871110280354815
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,256,3072,0.014230221509933472
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,256,2048,0.004885333279768626
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,256,2560,0.029488000604841445
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,256,2560,0.0140364451540841
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,256,1536,0.004543999830881755
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,256,2048,0.027387556102540758
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,256,2048,0.013400000002649097
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,256,1024,0.0038311113086011675
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,256,1536,0.013064888616402945
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,256,1536,0.027095110880004034
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,256,768,0.0035093331502543557
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,256,1024,0.01237155579858356
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,256,1024,0.023997333314683702
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,256,512,0.003436444534195794
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,256,768,0.01242844429281023
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,256,768,0.02404622236887614
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,256,256,0.0031946665710873077
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,256,512,0.023149333066410486
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,256,128,0.0028044444819291434
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,256,6144,0.007672000262472365
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,256,256,0.02299733294381036
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,256,64,0.0025519999778932994
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,256,128,0.01887911061445872
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,256,128,0.011343999869293638
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,256,32,0.002530666689078013
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,128,65536,0.014936000108718872
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,256,64,0.011735999749766456
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,256,32,0.011051555474599203
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,128,51200,0.013389333254761167
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,128,65536,0.11216889487372504
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,256,3072,0.030504888958401147
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,128,51200,0.08813066614998712
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,128,16384,0.009712888962692684
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,128,51200,0.18847200605604383
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,128,16384,0.032568001084857516
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,128,12288,0.008640000389681922
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,128,16384,0.07278755638334486
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,128,10240,0.009027555584907532
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,128,12288,0.02702399922741784
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,128,12288,0.05885510974460178
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,128,8192,0.00829777783817715
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,128,10240,0.0239982224173016
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,256,512,0.011706666813956367
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,128,10240,0.05243733194139269
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,128,7168,0.008018666671382057
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,128,8192,0.02125866711139679
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,128,8192,0.04697688751750522
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,128,6144,0.007657777931955125
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,128,7168,0.019294222195943195
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,128,7168,0.04242222176657783
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,128,5120,0.007305777735180325
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,128,6144,0.018211555149820115
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,128,6144,0.03942044576009115
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,128,4096,0.006788444601827198
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,128,5120,0.016499555773205228
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,128,3584,0.006574222197135289
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,128,4096,0.015185778339703878
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,256,65536,0.23587822914123535
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,128,3072,0.005954666684071223
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,128,65536,0.2351564566294352
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,128,3584,0.014488000008794995
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,128,3584,0.03092355529467265
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,128,2560,0.006633777585294511
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,128,3072,0.014141332772043018
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,128,3072,0.031197332673602637
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,128,2048,0.005949333310127258
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,128,2560,0.013423999978436364
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,128,2560,0.02847644355561998
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,128,1536,0.004361777669853634
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,128,2048,0.013461333182122974
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,128,2048,0.027411555250485737
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,128,1024,0.003855111284388436
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,128,1536,0.012727110750145383
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,128,1536,0.027107555005285475
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,128,768,0.003535110917356279
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,128,1024,0.01221244451072481
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,128,1024,0.024688000480333965
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,256,256,0.011777777638700275
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,128,768,0.0233262214395735
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,128,768,0.012411555482281579
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,128,256,0.0031902222997612427
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,128,512,0.012104888757069906
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,128,512,0.023315555519527856
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,128,128,0.002814222127199173
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,128,256,0.011723555624485016
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,128,5120,0.03563466668128967
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,128,256,0.02239911092652215
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,128,64,0.0028133332315418455
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,128,32,0.002620444529586368
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,128,4096,0.03355111016167535
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,128,128,0.011014222270912595
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,160,128,128,0.01958311100800832
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,64,65536,0.015145777000321282
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,64,51200,0.014183999763594734
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,128,64,0.011689778003427716
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,64,16384,0.008994667066468133
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,128,32,0.011003555523024665
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,64,12288,0.007996444072988298
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,64,10240,0.007337777978844113
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,64,65536,0.11125155289967854
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,64,51200,0.08476710981792873
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,64,16384,0.03288799855444167
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,64,8192,0.007279111279381647
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,64,12288,0.026920888159010146
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,64,7168,0.006639110959238476
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,64,10240,0.02426044477356805
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,64,6144,0.006618666566080517
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,64,5120,0.006279110908508301
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,64,8192,0.021456888980335657
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,64,7168,0.0195777780479855
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,64,4096,0.005949333310127258
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,64,6144,0.018197332819302876
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,64,3584,0.006249777972698212
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,64,3072,0.005976888868543837
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,64,5120,0.016819554898473952
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,64,2560,0.006235555642180973
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,64,4096,0.01551999979548984
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,64,3584,0.015142222245534262
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,64,2048,0.006163555714819167
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,64,1536,0.004232888834344016
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,64,3072,0.014111111561457316
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,64,1024,0.0038524443904558816
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,128,512,0.003144888828198115
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,64,768,0.003527111063400904
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,64,2560,0.013458666702111563
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,64,512,0.003181333343187968
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,64,2048,0.013423110875818463
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,64,256,0.0028604444944196274
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,64,128,0.002814222127199173
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,64,1536,0.013106666505336761
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,64,1024,0.012390221986505719
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,64,64,0.0025315555847353404
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,64,768,0.011757333245542316
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,64,32,0.002483555633160803
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,64,512,0.011700444751315646
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,64,256,0.011369778050316704
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,32,65536,0.014152000347773233
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,64,128,0.011064888702498542
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,32,16384,0.008296888735559251
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,64,64,0.011742221812407175
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,64,32,0.011376000112957425
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,32,12288,0.007264888948864407
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,32,10240,0.007282666862010956
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,32,65536,0.10690933465957642
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,32,8192,0.006974221931563483
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,32,51200,0.08494755294587876
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,32,7168,0.006642666541867786
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,32,12288,0.026758222116364375
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,32,10240,0.02401422295305464
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,32,6144,0.006252444452709622
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,32,5120,0.006008000009589725
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,32,8192,0.021362667282422382
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,32,4096,0.0058906666106647914
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,32,7168,0.019229332605997723
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,32,3584,0.0064604443808396654
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,32,6144,0.018226666582955253
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,32,5120,0.016992888516849942
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,32,3072,0.005897777775923411
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,32,2560,0.006593777901596493
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,32,4096,0.015508444772826301
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,32,2048,0.006250666661394968
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,32,3584,0.014495111174053617
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,32,1536,0.00424177779091729
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,32,3072,0.01447111037042406
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,32,1024,0.0038577777643998465
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,32,768,0.0035173334181308746
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,32,2048,0.013352000051074557
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,32,1536,0.012758221891191272
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,32,512,0.0031866667171319327
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,32,1024,0.01274577776590983
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,32,256,0.0028417776856157514
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,32,768,0.012104888757069906
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,32,128,0.002833777831660377
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,32,512,0.012042666474978128
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,32,64,0.002628444383541743
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,32,256,0.01178311142656538
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,32,32,0.002513777878549364
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,32,128,0.011376000112957425
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,32,64,0.011477332976129321
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,160,32,51200,0.012076444096035428
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,32,32,0.011748444702890186
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,32,16384,0.03256977929009332
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,65536,16384,0.33751644028557676
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,65536,16384,0.2838835451338026
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,65536,12288,0.25792709986368817
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,160,32,2560,0.013452444639470843
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,65536,10240,0.21375021669599745
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,65536,12288,0.2133235534032186
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,65536,10240,0.18142578336927626
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,65536,8192,0.17637244860331217
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,65536,51200,0.870306650797526
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,65536,51200,1.0444960064358182
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,65536,7168,0.15518044100867376
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,65536,8192,0.14887555440266928
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,65536,6144,0.13326666090223524
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,65536,7168,0.12913421789805093
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,65536,4096,0.09659822119606866
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,65536,3584,0.0820888876914978
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,65536,6144,0.11248355441623265
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,65536,5120,0.09570311175452338
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,65536,3072,0.07226755883958605
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,65536,2560,0.06070399946636624
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,65536,3584,0.07127110825644599
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,65536,2048,0.0508266654279497
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,65536,3072,0.06305688619613647
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,65536,1536,0.03944977786805894
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,65536,2560,0.056164443492889404
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,65536,1024,0.028982222080230713
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,65536,1536,0.040299554665883384
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,65536,768,0.02325600054528978
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,65536,2048,0.048735111951828
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,65536,512,0.016141333513789706
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,65536,1024,0.03307822346687317
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,65536,256,0.010684444672531553
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,65536,128,0.008653333617581261
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,65536,768,0.040066666073269315
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,65536,64,0.00793688909875022
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,65536,256,0.022610666023360357
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,65536,128,0.021202666891945735
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,65536,32,0.007968000239796108
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,65536,64,0.02124711043304867
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,65536,32,0.0210533340771993
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,65536,4096,0.0796711113717821
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,51200,16384,0.2866017818450928
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,51200,51200,0.6951368649800619
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,51200,51200,0.8889697392781576
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,51200,65536,0.9075359768337674
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,65536,512,0.02976622184117635
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,51200,65536,1.1291475296020508
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,51200,16384,0.22957777976989746
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,51200,12288,0.21863199604882133
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,51200,10240,0.19814577367570665
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,65536,5120,0.1133155557844374
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,51200,10240,0.1475315491358439
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,51200,8192,0.12183554967244466
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,51200,7168,0.14288711547851562
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,51200,8192,0.1623484426074558
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,51200,6144,0.12283378177218968
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,51200,12288,0.1733671161863539
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,51200,6144,0.09260533253351848
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,51200,4096,0.08447911341985066
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,51200,5120,0.10352000263002183
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,51200,3584,0.0742595526907179
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,51200,3072,0.06489777565002441
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,51200,2560,0.05421688821580675
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,51200,5120,0.07923377884758843
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,51200,3584,0.059843553437127
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,51200,2048,0.04442844457096524
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,51200,3072,0.053267555104361645
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,51200,2560,0.04756800002521939
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,51200,1024,0.02597066594494714
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,51200,2048,0.04108533263206482
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,51200,768,0.01920088960064782
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,51200,1536,0.034635557068718806
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,51200,512,0.013855111267831592
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,51200,1536,0.03504000107447306
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,51200,256,0.009746666583749983
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,51200,1024,0.02881066666709052
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,51200,4096,0.0663964417245653
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,51200,768,0.03229422370592753
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,51200,64,0.005562666803598404
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,51200,512,0.02606044378545549
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,51200,256,0.020281778441535104
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,51200,128,0.018932445181740653
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,51200,64,0.01888088881969452
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,51200,32,0.019923556182119582
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,16384,51200,0.2660951084560818
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,16384,65536,0.35159733560350204
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,16384,16384,0.08890755308998956
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,16384,51200,0.2763813336690267
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,16384,12288,0.07071110937330458
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,16384,10240,0.05712888638178507
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,16384,16384,0.09535466962390476
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,16384,12288,0.07498577568266127
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,16384,8192,0.04883644315931532
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,16384,7168,0.04201511210865445
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,16384,10240,0.06493422057893541
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,16384,8192,0.05349599983957079
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,16384,6144,0.03664888938268026
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,16384,5120,0.03183022141456604
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,16384,7168,0.04731288883421156
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,51200,128,0.006698666761318843
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,16384,4096,0.02737688852681054
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,51200,32,0.005895111295912001
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,16384,6144,0.04267999860975477
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,16384,3584,0.02381155557102627
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,16384,5120,0.03764444589614868
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,16384,3072,0.02090488870938619
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,16384,2560,0.01756355497572157
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,16384,2048,0.014692443940374585
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,16384,3584,0.029947555727428857
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,16384,3072,0.02662044432428148
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,16384,1536,0.01180622229973475
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,16384,2560,0.02476088868247138
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,16384,1024,0.009457777771684859
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,16384,768,0.007986666427718269
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,16384,2048,0.02204533252451155
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,16384,512,0.006506666541099548
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,16384,1536,0.019596444235907663
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,16384,1024,0.017816889617178176
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,16384,256,0.00452622233165635
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,16384,128,0.003899555653333664
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,16384,768,0.019221333993805777
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,16384,64,0.003548444559176763
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,16384,512,0.016210666961140104
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,16384,256,0.014473777678277759
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,16384,32,0.004200889004601372
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,16384,128,0.013771555489963956
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,16384,64,0.014094221923086377
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,16384,32,0.014807111687130399
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,12288,65536,0.27618310186598033
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,12288,51200,0.21476356188456217
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,12288,65536,0.2654995653364393
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,12288,16384,0.07373866770002577
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,12288,12288,0.05635199944178263
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,12288,10240,0.04701155424118042
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,12288,12288,0.05926311016082764
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,12288,16384,0.07422133286794026
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,12288,8192,0.04047466648949517
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,16384,4096,0.032582223415374756
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,12288,7168,0.03476622369554307
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,12288,8192,0.04276444514592489
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,12288,6144,0.030144890149434406
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,12288,7168,0.038089778688218855
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,12288,5120,0.02630133264594608
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,16384,65536,0.33751556608412003
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,12288,4096,0.02288088864750332
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,12288,6144,0.03458222084575229
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,12288,3584,0.01959288948112064
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,12288,5120,0.030879110097885132
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,12288,3072,0.01722400055991279
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,12288,2560,0.014709333578745524
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,12288,4096,0.026463111241658527
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,12288,3584,0.024344889654053584
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,12288,3072,0.02256977723704444
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,12288,2048,0.01276088919904497
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,12288,1536,0.010696888797812991
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,12288,2560,0.02123022245036231
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,12288,2048,0.019553777244355943
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,12288,1536,0.018197332819302876
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,12288,1024,0.015508444772826301
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,12288,512,0.005683555371231503
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,12288,51200,0.21047288841671416
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,12288,768,0.017208000024159748
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,12288,256,0.004547555413511065
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,12288,128,0.003933333274390963
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,12288,512,0.015127110812399121
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,12288,256,0.013456000222100152
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,12288,64,0.0038480001191298165
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,12288,32,0.0037768888804647657
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,12288,128,0.013456000222100152
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,12288,10240,0.05192177825503879
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,12288,64,0.013242666920026144
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,51200,7168,0.10516444179746841
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,12288,32,0.013080000049538083
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,10240,16384,0.07047200202941895
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,10240,65536,0.2666230996449788
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,10240,51200,0.20947110652923584
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,10240,65536,0.2547057734595405
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,10240,51200,0.20096000035603842
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,10240,12288,0.05495288968086243
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,10240,16384,0.07182488838831584
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,10240,10240,0.04602577620082431
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,10240,8192,0.03868888815244039
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,12288,1024,0.008838222258620793
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,10240,7168,0.03422755665249295
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,10240,6144,0.029841777351167467
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,10240,10240,0.05041422115431892
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,10240,8192,0.04139466749297248
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,10240,5120,0.02568799919552273
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,12288,768,0.007699555820888943
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,10240,7168,0.036943111154768206
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,10240,4096,0.02179644505182902
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,10240,3584,0.018966222802797954
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,10240,3072,0.016881777180565726
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,10240,5120,0.028805332051383123
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,10240,2560,0.014472888575659858
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,10240,3584,0.02381422287887997
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,10240,4096,0.025621333056026038
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,10240,2048,0.012689777546458773
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,10240,3072,0.022439110610220168
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,10240,1536,0.010657777388890585
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,10240,1024,0.008600888980759515
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,10240,2560,0.02072622213098738
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,10240,2048,0.019154666198624503
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,10240,768,0.006909333169460297
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,10240,512,0.005919111271699269
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,10240,1536,0.017703110973040264
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,10240,1024,0.015053333507643806
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,10240,256,0.004878222114510006
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,10240,768,0.016540444559521146
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,10240,128,0.0038684445122877755
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,10240,64,0.0035128887328836652
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,10240,512,0.01462044484085507
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,10240,256,0.01312444441848331
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,10240,32,0.0035235554807715942
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,10240,128,0.012961777547995249
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,10240,64,0.013094222380055321
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,10240,32,0.012125333150227865
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,8192,65536,0.19463466273413765
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,8192,51200,0.15151377518971762
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,8192,16384,0.0520666672123803
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,10240,12288,0.057110223505232066
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,8192,65536,0.21182666884528267
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,8192,12288,0.04117244482040405
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,8192,51200,0.16856711440616182
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,8192,10240,0.03418044580353631
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,10240,6144,0.033547557062572904
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,8192,8192,0.029319110843870375
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,8192,12288,0.04934755629963345
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,8192,16384,0.061166220241122775
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,8192,10240,0.04338666796684265
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,8192,7168,0.025356445047590468
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,8192,5120,0.01925155520439148
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,8192,6144,0.022271111607551575
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,8192,4096,0.016710221767425537
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,8192,8192,0.035284443034066096
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,8192,6144,0.02827199962404039
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,8192,3072,0.01310755560795466
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,8192,2560,0.011391999820868174
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,8192,4096,0.022665777140193518
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,8192,5120,0.025433777107132807
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,8192,3584,0.021319111188252766
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,8192,3072,0.020259555843141343
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,8192,1536,0.008619555168681675
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,8192,1024,0.00656444455186526
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,8192,2560,0.01923199991385142
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,8192,2048,0.017516444126764934
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,8192,768,0.005554666535721884
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,8192,1536,0.016235555211702984
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,8192,512,0.004537777768241035
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,8192,1024,0.014364444547229342
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,8192,768,0.01550044450494978
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,8192,128,0.003489777859714296
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,8192,512,0.014479999740918478
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,8192,256,0.012817777693271637
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,8192,128,0.012442666623327466
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,8192,32,0.003506666670242945
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,8192,64,0.012228444218635559
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,8192,32,0.012229333321253458
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,7168,65536,0.16539733939700657
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,8192,7168,0.03196000059445699
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,7168,51200,0.1326568921407064
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,8192,3584,0.014319111903508505
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,7168,16384,0.049908445941077344
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,7168,65536,0.2079955604341295
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,8192,2048,0.01032266683048672
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,7168,12288,0.03928177886539035
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,7168,16384,0.060191108120812305
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,7168,51200,0.16465955310397679
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,7168,10240,0.03293244375122918
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,7168,12288,0.048446221484078296
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,7168,8192,0.028173334068722192
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,7168,7168,0.024780443973011438
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,7168,6144,0.02169955604606205
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,7168,10240,0.041913777589797974
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,8192,256,0.003863999827040566
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,7168,8192,0.03455288873778449
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,7168,5120,0.018509333332379658
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,7168,7168,0.030647112263573542
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,7168,4096,0.015850666496488783
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,7168,6144,0.02774488925933838
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,7168,3072,0.012960000170601739
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,8192,64,0.0035377778112888336
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,7168,5120,0.024917332662476435
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,7168,2560,0.011115555961926779
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,7168,4096,0.022626666559113398
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,7168,2048,0.009705777797434065
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,7168,3584,0.021274665991465252
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,7168,1536,0.008477333519193862
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,7168,3072,0.020047111643685233
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,7168,1024,0.006326222171386083
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,7168,768,0.005222222043408289
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,7168,2560,0.018906666172875296
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,7168,2048,0.01721244388156467
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,7168,512,0.004569777597983678
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,7168,1024,0.014095111025704278
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,7168,256,0.0036319999231232535
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,7168,128,0.0035333335399627686
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,7168,768,0.015275556180212231
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,7168,64,0.0031999999450312722
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,7168,512,0.013774221969975365
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,7168,32,0.003220444545149803
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,7168,256,0.012728888955381183
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,7168,128,0.01239999963177575
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,7168,64,0.012103111379676394
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,7168,32,0.013810666898886362
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,6144,65536,0.1518053346210056
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,6144,51200,0.11993332703908284
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,6144,16384,0.04720800121625265
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,6144,65536,0.17076888349321154
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,6144,12288,0.03362311257256402
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,6144,51200,0.13467466831207275
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,6144,10240,0.030068443881140813
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,6144,16384,0.05095022254519992
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,6144,8192,0.024531554844644334
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,6144,7168,0.021686222818162706
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,6144,12288,0.04118577639261881
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,6144,6144,0.019519110520680744
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,6144,10240,0.03524177935388353
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,6144,8192,0.029481778542200725
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,6144,5120,0.01689511040846507
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,6144,7168,0.02605688903066847
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,6144,4096,0.014751111467679342
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,7168,3584,0.01388088862101237
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,6144,3584,0.012702222499582501
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,6144,6144,0.024155555499924555
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,6144,3072,0.011711999773979187
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,6144,2560,0.00981244444847107
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,6144,4096,0.0199297782447603
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,6144,2048,0.008965333302815756
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,6144,3584,0.019126221537590027
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,6144,3072,0.018236445056067575
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,6144,1536,0.007594666547245449
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,6144,1024,0.005892444401979446
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,6144,2560,0.017163554827372234
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,6144,2048,0.015480000111791821
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,6144,768,0.004884444591071871
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,6144,512,0.004222222086456087
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,6144,1536,0.014462222655614218
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,6144,1024,0.01348888874053955
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,6144,256,0.0035439998739295532
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,6144,128,0.0032088889016045462
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,6144,64,0.00315022220214208
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,6144,512,0.013425778183672162
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,6144,32,0.0032044444233179092
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,6144,256,0.01239377756913503
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,6144,128,0.012048000262843238
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,6144,64,0.011927111281288994
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,6144,32,0.013085333009560903
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,5120,51200,0.09682399696773952
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,5120,65536,0.1656951109568278
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,5120,16384,0.03858933183881972
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,5120,12288,0.03392088744375441
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,5120,51200,0.13139111465877956
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,5120,16384,0.04945688777499729
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,5120,10240,0.02796799937884013
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,5120,12288,0.03853066762288412
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,5120,10240,0.03349511159790887
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,6144,5120,0.022295110755496558
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,5120,8192,0.028452446063359577
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,5120,6144,0.01878666712178124
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,5120,7168,0.025834666358100042
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,5120,5120,0.015792000624868605
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,7168,1536,0.01581333412064446
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,5120,4096,0.01351111133893331
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,6144,768,0.014471999473041959
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,5120,5120,0.02197066611713833
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,5120,3584,0.01201866649919086
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,5120,3072,0.010783111055692038
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,5120,4096,0.02013511127895779
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,5120,2560,0.009637333452701569
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,5120,65536,0.11923021740383571
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,5120,3584,0.019149333238601685
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,5120,2048,0.008641777767075432
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,5120,3072,0.017549332645204332
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,5120,1536,0.007017778025733099
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,5120,2560,0.016511110795868766
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,5120,2048,0.015164444843928019
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,5120,1536,0.014487110906177096
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,5120,1024,0.013410666750537025
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,5120,512,0.004048000193304486
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,5120,8192,0.023913777536816064
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,5120,256,0.003666666646798452
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,5120,512,0.01309333327743742
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,5120,7168,0.021078222327762183
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,5120,128,0.0031893334041039148
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,5120,256,0.012390221986505719
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,5120,64,0.003168888803985384
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,5120,128,0.011763555308183035
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,5120,32,0.003177777760558658
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,5120,6144,0.02402044501569536
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,4096,65536,0.1046782202190823
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,5120,32,0.012072888513406118
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,4096,51200,0.08422933022181193
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,4096,65536,0.1597075594796075
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,5120,1024,0.005605333381228977
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,4096,16384,0.03410133388307359
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,4096,51200,0.12750844160715738
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,5120,768,0.004563555535342959
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,4096,12288,0.027793778313530818
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,4096,10240,0.02199199961291419
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,4096,16384,0.046625776423348315
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,4096,8192,0.018823110395007663
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,4096,12288,0.03653066688113742
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,5120,768,0.01443733274936676
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,4096,7168,0.016536888149049547
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,4096,6144,0.014236445228258768
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,4096,10240,0.032872888776991106
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,4096,5120,0.012706666356987424
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,4096,8192,0.02753777801990509
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,4096,4096,0.011331555744012197
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,4096,7168,0.025311999850802954
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,4096,5120,0.021548445026079815
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,4096,3072,0.00853777759604984
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,4096,3584,0.01852799952030182
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,5120,64,0.012030222349696688
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,4096,2560,0.007680888805124495
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,4096,3072,0.016515556308958266
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,4096,2048,0.006631999793979857
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,4096,1536,0.005255110975768831
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,4096,2560,0.015818667080667283
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,4096,1024,0.004536889079544279
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,4096,1536,0.014101333088344999
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,4096,768,0.0041999999019834726
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,4096,1024,0.013368888861603208
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,4096,512,0.0038684445122877755
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,4096,256,0.003516444315512975
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,4096,768,0.013779555757840475
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,4096,128,0.003165333428316646
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,4096,512,0.013060444758998023
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,4096,64,0.0028773333049482773
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,4096,256,0.012104888757069906
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,4096,32,0.0032319999817344877
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,4096,128,0.011940444509188334
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,4096,64,0.011751111182901593
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,3584,65536,0.08612089024649726
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,4096,32,0.011717333561844297
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,4096,3584,0.009754666851626502
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,3584,51200,0.07163466347588433
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,4096,4096,0.019820445113711886
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,3584,16384,0.0336791111363305
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,3584,65536,0.15632711516486272
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,3584,51200,0.12618311246236166
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,3584,12288,0.026797332697444495
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,3584,10240,0.023615999354256526
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,3584,16384,0.045455111397637256
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,3584,8192,0.017157332764731515
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,3584,12288,0.03633244501219855
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,3584,7168,0.015442666080262927
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,3584,10240,0.032292445500691734
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,3584,8192,0.027284445034133062
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,4096,2048,0.014800000521871777
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,3584,5120,0.012105777859687805
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,3584,7168,0.025053333905008104
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,3584,4096,0.010953777366214328
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,3584,6144,0.023132445083724126
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,3584,3584,0.00962311112218433
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,3584,3072,0.008956444760163626
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,3584,5120,0.02124622298611535
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,3584,2560,0.007260444263617198
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,3584,4096,0.01904622217019399
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,3584,2048,0.006235555642180973
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,3584,3584,0.017285333739386666
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,3584,1536,0.005551110953092575
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,3584,3072,0.016536000702116225
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,3584,1024,0.004511111312442356
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,3584,2560,0.015750222735934787
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,3584,768,0.0042088888585567474
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,3584,512,0.0038373333712418876
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,3584,1536,0.014104000396198697
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,3584,1024,0.013427555561065674
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,3584,256,0.0035217776894569397
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,3584,768,0.013429332938459186
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,3584,128,0.003167111012670729
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,3584,512,0.012727110750145383
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,3584,64,0.0028364445186323593
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,3584,32,0.0028906667398081887
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,3584,256,0.012527999778588613
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,3584,128,0.011613333390818702
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,3584,64,0.011748444702890186
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,4096,6144,0.023431999815834895
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,3072,65536,0.07598400115966797
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,3584,32,0.01126933346192042
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,3072,51200,0.06204977962705824
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,3072,16384,0.02641511129008399
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,3072,12288,0.02237244447072347
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,3072,65536,0.118487106429206
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,3072,10240,0.018906666172875296
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,3072,51200,0.09606489208009507
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,3072,12288,0.029002666473388672
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,3584,6144,0.013780444032616086
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,3072,10240,0.026145777768558923
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,3072,7168,0.013785777820481194
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,3072,8192,0.022686221533351477
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,3072,6144,0.012076444096035428
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,3072,5120,0.011056889262464313
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,3072,7168,0.020937777227825586
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,3072,4096,0.010199999643696679
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,3072,6144,0.019913777709007263
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,3072,5120,0.017927999297777813
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,3072,3584,0.009024889104896123
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,3072,3072,0.008278222547637092
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,3584,2048,0.01477688882086012
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,3072,4096,0.015815999772813585
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,3072,2560,0.007910221815109253
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,3072,2048,0.0068959999415609576
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,3072,3584,0.015781333049138386
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,3072,1536,0.005884444548024072
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,3072,2560,0.014455111490355598
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,3072,1024,0.004547555413511065
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,3072,2048,0.013757333159446716
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,3072,768,0.0042239998777707415
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,3072,1536,0.013403555585278405
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,3072,512,0.003625777860482534
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,3072,1024,0.012728888955381183
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,3072,256,0.003524444583389494
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,3072,768,0.013373333546850415
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,3072,128,0.0031946665710873077
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,3072,512,0.01275022245115704
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,3072,16384,0.035319109757741295
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,3072,64,0.0028151110228565005
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,3072,32,0.0028719999310043124
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,3072,256,0.011777777638700275
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,3072,8192,0.015800888339678448
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,3072,128,0.011419555379284753
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,2560,65536,0.0669742226600647
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,3072,64,0.011418666276666852
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,2560,51200,0.054303109645843506
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,3072,32,0.011746666497654386
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,2560,16384,0.024505777491463557
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,2560,12288,0.020845333735148113
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,2560,65536,0.11671200063493516
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,2560,10240,0.018173333671357896
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,2560,8192,0.014091556270917257
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,2560,51200,0.09326666593551636
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,2560,16384,0.033928000264697604
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,2560,12288,0.02819377846188015
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,2560,7168,0.013250666360060373
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,2560,6144,0.011345778074529437
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,2560,10240,0.025632888078689575
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,2560,5120,0.01032977799574534
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,2560,8192,0.02218222286966112
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,2560,7168,0.020622221959961783
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,2560,3584,0.008630221916569604
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,2560,3072,0.00775999989774492
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,2560,5120,0.017285333739386666
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,2560,4096,0.01568622224860721
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,2560,2560,0.007280888656775157
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,3072,3072,0.014816888504558139
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,2560,3584,0.015114666687117683
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,2560,2048,0.006052444378534953
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,2560,1536,0.005202666752868229
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,2560,3072,0.01460000044769711
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,2560,1024,0.00444444434510337
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,2560,768,0.0038728887836138406
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,2560,2560,0.014089778065681458
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,2560,2048,0.013731555806265937
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,2560,1536,0.013139555851618448
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,2560,512,0.0036159998012913596
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,2560,256,0.0032088889016045462
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,2560,1024,0.01275288893116845
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,2560,128,0.002833777831660377
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,2560,768,0.013056000073750814
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,2560,64,0.003168888803985384
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,2560,512,0.01275199982855055
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,2560,32,0.003168888803985384
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,2560,256,0.011711111499203576
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,2560,128,0.011719110939237805
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,2048,65536,0.05647022194332547
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,2560,64,0.011396444506115384
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,2560,32,0.011792889071835412
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,2048,51200,0.046441776884926685
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,2048,16384,0.019927110936906602
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,2048,12288,0.016480889585283067
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,2048,65536,0.11269511116875543
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,2048,10240,0.014560888210932413
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,2048,8192,0.014448000325096978
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,2048,16384,0.03322311242421468
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,2048,12288,0.027895109521018133
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,2048,7168,0.01311644415060679
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,2048,10240,0.025432000557581585
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,2048,6144,0.011383111278216044
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,2048,5120,0.010034666293197209
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,2048,8192,0.021659556362364028
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,2048,7168,0.020052444603708055
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,2048,4096,0.008911111288600499
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,2560,4096,0.009296000003814697
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,2048,6144,0.018601778480741713
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,2560,6144,0.01938222183121575
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,2048,5120,0.01720355616675483
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,2048,3072,0.007584888901975419
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,2048,4096,0.01548266741964552
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,2048,2560,0.006576889091067844
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,2048,2048,0.0058986664646201665
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,2048,3584,0.014829332629839579
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,2048,1536,0.005215999980767568
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,2048,3072,0.014752000570297241
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,2048,2560,0.014091556270917257
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,2048,1024,0.0042204442951414315
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,2048,768,0.0038782221575578055
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,2048,2048,0.013418667018413544
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,2048,512,0.0035457776652442086
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,2048,1536,0.01308444473478529
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,2048,256,0.0032213332338465583
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,2048,768,0.012746666868527731
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,2048,128,0.0029680000411139596
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,2048,512,0.012169777519173093
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,2048,64,0.0028088889602157804
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,2048,256,0.011712888876597086
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,2048,32,0.0028657778683635923
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,2048,128,0.011764444410800934
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,2048,64,0.011373333632946014
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,1536,65536,0.04524622360865275
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,2048,32,0.011389333340856763
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,2048,51200,0.09126133388943142
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,1536,51200,0.03595111105177138
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,1536,16384,0.017835555805100333
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,1536,12288,0.014767999450365702
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,1536,51200,0.08837955527835423
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,1536,16384,0.03292266527811686
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,1536,10240,0.013405332962671915
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,2048,3584,0.0079644446571668
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,1536,8192,0.013072888884279462
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,1536,12288,0.027787556250890095
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,1536,7168,0.014322666658295525
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,1536,10240,0.025377778543366328
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,1536,6144,0.012636444634861417
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,1536,5120,0.009986666341622671
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,1536,8192,0.02130844526820713
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,1536,4096,0.008619555168681675
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,1536,7168,0.019664888580640156
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,1536,3584,0.007879111501905654
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,1536,6144,0.017934223016103108
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,1536,3072,0.007182222273614671
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,1536,4096,0.015452444553375244
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,1536,2560,0.006230222268237009
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,1536,3584,0.015103111664454142
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,1536,2048,0.005533333453867171
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,1536,3072,0.014525334040323893
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,1536,1536,0.00489688871635331
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,1536,2560,0.014149333039919535
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,1536,1024,0.004201777693298128
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,1536,1536,0.013219555219014486
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,1536,768,0.0038977778620190094
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,1536,1024,0.012463111016485425
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,1536,512,0.003506666670242945
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,1536,768,0.01276177747382058
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,1536,256,0.0033128888656695685
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,1536,65536,0.10986577802234226
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,1536,512,0.01222222215599484
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,1536,128,0.0031475555151700974
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,1536,64,0.0028844444702068963
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,1536,256,0.012089778151777057
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,1536,32,0.002973333415057924
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,1536,128,0.011722666521867117
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,1536,64,0.011367999845080905
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,1024,65536,0.032792889409595065
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,1024,51200,0.02681866619322035
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,1536,32,0.011758222348160215
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,1024,16384,0.01479200025399526
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,1024,12288,0.013080000049538083
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,1536,5120,0.016536000702116225
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,1024,51200,0.08506488800048828
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,1024,65536,0.10628889004389445
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,1024,16384,0.03249866763750712
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,1024,10240,0.01203733351495531
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,1024,8192,0.010843555960390302
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,2048,1024,0.012520000338554382
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,1024,7168,0.010293333066834344
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,1024,12288,0.026749332745869953
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,1024,6144,0.009979555176364051
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,1024,5120,0.009654222263230218
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,1024,10240,0.024292444189389546
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,1024,4096,0.007997333175606197
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,1024,7168,0.01889333294497596
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,1024,3584,0.007436444362004598
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,1024,6144,0.01759199963675605
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,1024,3072,0.006594666590293248
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,1536,2048,0.013449778159459433
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,1024,2560,0.006010666489601135
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,1024,4096,0.01516533394654592
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,1024,2048,0.005294222384691238
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,1024,3584,0.014485332700941296
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,1024,1536,0.004579555657174853
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,1024,3072,0.014114666316244336
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,1024,1024,0.0041786668201287585
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,1024,2560,0.014093332820468478
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,1024,768,0.0038924444880750445
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,1024,2048,0.013432000246312885
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,1024,1536,0.012793777717484368
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,1024,512,0.0035146665241983202
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,1024,1024,0.012396444049146442
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,1024,256,0.0032231110251612137
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,1024,768,0.012381333443853589
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,1024,128,0.0028693332440323303
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,1024,64,0.0028320000403457214
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,1024,512,0.012088889049159156
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,1024,256,0.011705777711338468
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,1024,32,0.0028000000036425064
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,1024,128,0.011485333244005838
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,1024,64,0.011717333561844297
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,768,65536,0.02917155623435974
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,768,51200,0.02432800001568264
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,1024,32,0.011036444041464063
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,768,16384,0.012074666718641916
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,768,12288,0.011122666299343109
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,768,51200,0.08385155598322551
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,768,10240,0.010663111176755695
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,768,16384,0.03201155530081855
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,768,8192,0.009670221971140968
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,768,12288,0.026770666241645813
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,768,7168,0.01071466671095954
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,768,10240,0.023034666975339253
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,1024,8192,0.01997155613369412
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,768,6144,0.009530666801664565
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,768,8192,0.019919999771647982
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,768,5120,0.008656889200210571
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,768,4096,0.008014221986134848
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,768,7168,0.01889244384235806
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,768,6144,0.017904000149832833
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,768,3584,0.007661333514584436
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,768,5120,0.016536000702116225
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,768,3072,0.006312888943486744
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,768,2560,0.0058906666106647914
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,768,4096,0.01517688896920946
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,768,2048,0.0052639999323421055
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,768,3584,0.0148026661740409
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,768,3072,0.014119111829333834
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,768,2560,0.014106666048367819
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,768,1024,0.0041786668201287585
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,768,2048,0.01312888910373052
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,768,768,0.0036186666952239144
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,768,1536,0.012748444245921241
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,768,512,0.0033324443631701996
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,768,1024,0.012468444804350534
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,768,256,0.003185777821474605
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,768,768,0.012461333639091916
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,768,128,0.003024000053604444
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,768,512,0.012048000262843238
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,768,64,0.0026524443593290118
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,768,65536,0.10490044620301987
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,768,256,0.011753777662913004
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,768,32,0.0028640000770489373
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,768,128,0.011409777734014722
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,512,65536,0.024135111106766596
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,768,64,0.011029333704047732
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,512,51200,0.01957244508796268
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,512,16384,0.013112000293201871
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,512,65536,0.10254755285051133
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,512,12288,0.01124888906876246
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,512,51200,0.0818728870815701
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,1024,5120,0.016522667474216886
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,512,16384,0.030596445004145306
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,512,10240,0.010008888940016428
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,512,8192,0.00868622213602066
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,512,7168,0.008294222255547842
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,512,12288,0.025143999192449782
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,512,10240,0.02294844388961792
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,512,6144,0.007611555357774098
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,512,8192,0.019786667492654588
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,512,5120,0.008964444200197855
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,768,1536,0.00461777796347936
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,512,4096,0.007657777931955125
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,512,3584,0.0069413334131240845
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,512,6144,0.01756888959142897
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,512,3072,0.006309333360857434
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,512,2560,0.00592533333433999
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,512,4096,0.015119999647140503
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,512,3584,0.014487110906177096
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,512,2048,0.0052355556852287715
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,512,3072,0.014085332552591959
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,512,1536,0.0045422220395671
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,512,1024,0.0038542221817705366
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,512,2560,0.014136888914638095
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,512,768,0.0038746665749284956
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,512,2048,0.013148444394270578
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,512,512,0.003621333175235324
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,512,1536,0.01277599980433782
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,512,256,0.002847111059559716
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,512,1024,0.012383999923865
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,768,32,0.011400000088744693
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,512,512,0.012074666718641916
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,512,256,0.011696889168686338
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,512,64,0.0028293333533737394
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,512,32,0.0028693332440323303
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,512,128,0.011717333561844297
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,512,64,0.011358222199810876
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,256,65536,0.01978755493958791
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,512,32,0.0107022225856781
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,256,51200,0.016929777132140267
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,256,65536,0.1009262204170227
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,512,7168,0.018544000056054857
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,256,16384,0.01014311114947001
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,256,51200,0.0780808859401279
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,256,12288,0.01239911135700014
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,512,5120,0.01648177703221639
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,256,10240,0.011072888970375061
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,256,8192,0.010048000348938836
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,256,16384,0.029923554923799302
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,256,12288,0.025006221400366888
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,256,7168,0.009460444251696268
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,256,10240,0.02275466587808397
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,256,8192,0.019733332925372653
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,256,5120,0.008012444608741337
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,256,6144,0.017515555024147034
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,256,4096,0.0076142218377855085
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,256,5120,0.016473778420024447
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,256,3584,0.0069155556460221606
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,512,128,0.0028453332682450614
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,512,768,0.012445333103338877
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,256,4096,0.014839111102951897
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,256,2560,0.005910222315125995
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,256,3584,0.014835556348164877
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,256,2048,0.00488711107108328
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,256,3072,0.014408000641398959
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,256,1536,0.004536889079544279
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,256,2560,0.013768889009952545
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,256,1024,0.003914666672547658
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,256,2048,0.013421333498424955
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,256,768,0.003535110917356279
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,256,1536,0.01312711089849472
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,256,512,0.003195555466744635
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,256,1024,0.012601777911186218
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,256,256,0.003157333367400699
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,256,768,0.012402666939629449
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,256,128,0.0028284444577164124
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,256,512,0.012112889024946423
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,256,64,0.0028408887899584244
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,256,256,0.011415111521879831
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,256,32,0.0028417776856157514
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,256,6144,0.0086986662613021
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,256,128,0.011705777711338468
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,128,65536,0.015507555670208402
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,256,64,0.011738667057620155
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,256,7168,0.018439110782411363
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,128,51200,0.013074666261672974
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,128,16384,0.009685333404276106
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,128,12288,0.009638222555319468
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,128,65536,0.09884088569217259
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,128,10240,0.009328888522254096
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,128,51200,0.07697866360346477
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,128,16384,0.02980088856485155
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,128,8192,0.008359111017651027
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,128,12288,0.02475022276242574
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,128,7168,0.009366222553782994
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,256,3072,0.006248000181383557
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,128,6144,0.008301333420806462
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,128,10240,0.02292888859907786
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,128,5120,0.00869599978129069
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,128,4096,0.007600888609886169
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,128,7168,0.018230222993426852
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,128,3584,0.006963555183675554
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,128,6144,0.017511111166742113
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,128,5120,0.016494222813182406
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,128,4096,0.01517688896920946
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,128,2560,0.00554666668176651
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,128,2048,0.004878222114510006
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,128,3584,0.014158222410413953
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,128,3072,0.013841778039932251
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,128,1536,0.00452622233165635
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,128,2560,0.014126222994592456
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,128,2048,0.013468444347381592
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,128,768,0.003567999849716822
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,128,1536,0.01274577776590983
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,128,1024,0.01242844429281023
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,128,768,0.012727110750145383
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,128,256,0.002987555538614591
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,128,512,0.012095111111799875
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,128,128,0.0028693332440323303
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,256,32,0.011030221978823343
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,128,64,0.0028284444577164124
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,128,256,0.011781333221329583
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,128,32,0.0028311111446883944
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,128,128,0.01161688897344801
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,64,65536,0.01519466605451372
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,128,64,0.0107351111041175
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,128,32,0.011376889215575324
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,64,51200,0.013924444715181986
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,64,16384,0.009020444419648912
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,128,8192,0.01923288901646932
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,64,65536,0.09873244497511123
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,64,12288,0.009533333281675974
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,64,51200,0.07653422488106622
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,64,10240,0.008904000123341879
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,64,16384,0.029800001117918227
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,128,3072,0.006235555642180973
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,64,8192,0.008010666403505538
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,64,7168,0.008671999805503422
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,64,12288,0.025060445070266724
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,64,6144,0.008648888932334052
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,64,10240,0.022290666898091633
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,64,8192,0.01927199959754944
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,64,5120,0.007721777591440413
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,64,7168,0.018536888890796237
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,64,4096,0.007258666886223688
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,64,3584,0.006641777853171031
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,64,5120,0.015809777710172866
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,128,512,0.0032684444967243406
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,64,3072,0.006251555350091722
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,64,2560,0.006189333481921091
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,64,3584,0.014208000567224292
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,64,2048,0.005960888746711943
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,64,3072,0.013883555928866068
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,64,1536,0.004535111288229625
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,64,2560,0.013415111435784234
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,64,1024,0.0038542221817705366
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,64,2048,0.013068444199032254
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,64,768,0.003510222252872255
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,64,1536,0.0127368892232577
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,64,512,0.003181333343187968
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,64,1024,0.012051555845472546
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,64,256,0.0028888889484935333
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,64,768,0.01205599970287747
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,64,128,0.0025475554996066624
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,64,512,0.011737777955002256
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,64,64,0.0028435554769304064
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,64,256,0.011385777758227454
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,64,32,0.0028088889602157804
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,64,128,0.011045333411958484
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,32,65536,0.027403554982609216
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,64,64,0.011040888726711273
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,64,32,0.010696888797812991
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,128,1024,0.0038453332251972626
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,32,65536,0.09741333458158706
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,32,16384,0.009302222066455418
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,64,6144,0.01754133403301239
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,32,12288,0.009355555805895064
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,32,51200,0.07516622543334961
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,32,10240,0.008960888617568547
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,64,4096,0.014875556031862894
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,32,16384,0.02962755494647556
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,32,12288,0.025098666548728943
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,32,7168,0.008968888885445064
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,32,10240,0.022587555978033278
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,32,6144,0.008515555825498369
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,32,5120,0.007600888609886169
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,32,8192,0.019540444016456604
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,32,4096,0.007247111035717859
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,32,7168,0.01891999940077464
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,32,3584,0.006931555353932911
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,32,6144,0.01716888944307963
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,32,3072,0.006561777657932705
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,32,2560,0.005962666538026597
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,32,4096,0.01477777792347802
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,32,2048,0.005902222047249476
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,32,3584,0.015013333823945789
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,32,3072,0.013747555514176687
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,32,2560,0.013451555536852943
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,32,1024,0.003859555555714501
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,32,2048,0.013065777719020844
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,32,1536,0.012409778104888068
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,32,768,0.0034826666944556763
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,32,512,0.0031644445326593188
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,32,1024,0.012039999994966718
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,32,256,0.0028364445186323593
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,32,768,0.01205599970287747
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,32,51200,0.022634666826989915
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,32,128,0.0028364445186323593
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,32,64,0.00249422217408816
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,32,256,0.011425777441925473
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,32,32,0.00253866674999396
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,32,128,0.011051555474599203
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,32,64,0.010701333483060202
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,32,8192,0.007711999946170383
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,32,32,0.010665777656767102
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,32,5120,0.015844444433848064
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,65536,16384,0.3761582109663222
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,129,32,1536,0.004555555681387584
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,65536,51200,0.6618666648864746
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,65536,16384,0.22301067246331108
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,65536,12288,0.2789955668979221
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,129,32,512,0.01203555530971951
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,65536,12288,0.16788889302147758
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,65536,51200,1.1479653252495658
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,65536,10240,0.23774933815002441
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,65536,10240,0.14257066779666477
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,65536,8192,0.19374933507707384
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,65536,8192,0.11938933531443278
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,65536,7168,0.17073244518703887
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,65536,7168,0.10228000084559123
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,65536,6144,0.14535289340549046
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,65536,12288,0.23361510700649687
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,65536,6144,0.08986044592327541
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,65536,8192,0.16341955131954616
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,65536,10240,0.19973956214057076
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,65536,5120,0.12323555681440566
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,65536,16384,0.3108542230394152
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,65536,5120,0.07677600118849012
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,65536,4096,0.10037599669562446
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,65536,7168,0.14436888694763184
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,65536,3584,0.08841244379679362
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,65536,4096,0.06454488966200086
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,65536,5120,0.11222310860951741
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,65536,6144,0.12824889024098715
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,65536,3072,0.07753777503967285
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,65536,3584,0.058747556474473744
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,65536,2560,0.06454844607247247
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,65536,2560,0.04628088739183214
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,65536,4096,0.09659288989173041
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,65536,2048,0.05227999885876974
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,65536,3072,0.05211111240916782
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,65536,3072,0.0816355546315511
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,65536,2048,0.04168000155025058
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,65536,1536,0.04092355569203695
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,65536,2560,0.07251733541488647
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,65536,1024,0.030072000291612413
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,65536,1536,0.03426577647527059
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,65536,2048,0.06299999687406752
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,65536,768,0.022872888379626807
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,65536,1536,0.056424889299604625
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,65536,1024,0.04798400070932177
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,65536,512,0.015827554795477126
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,65536,768,0.02371999952528212
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,65536,768,0.04536711176236471
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,65536,512,0.020583111378881667
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,65536,512,0.041300445795059204
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,65536,128,0.008291555775536431
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,65536,256,0.0344524449772305
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,65536,128,0.01792888840039571
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,65536,64,0.005982222242487802
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,65536,128,0.02825511164135403
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,65536,32,0.006235555642180973
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,65536,64,0.01789422167672051
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,65536,32,0.020578665865792167
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,65536,1024,0.02830933199988471
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,65536,256,0.010678222609890832
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,51200,65536,0.6907697783576118
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,65536,256,0.019263111882739596
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,51200,65536,1.1163626776801217
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,65536,3584,0.08831022183100383
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,51200,16384,0.2837297651502821
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,65536,51200,0.9591991636488172
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,51200,51200,0.5292142232259115
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,51200,12288,0.13631021976470947
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,51200,12288,0.22442756758795845
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,51200,10240,0.168104887008667
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,51200,10240,0.11707377433776855
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,51200,16384,0.1796942287021213
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,51200,8192,0.13794933425055608
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,51200,12288,0.19975111219618055
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,51200,8192,0.09698488977220322
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,51200,7168,0.12000177966223823
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,51200,10240,0.17022755410936144
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,51200,6144,0.10378755463494195
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,51200,7168,0.08384178082148235
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,51200,6144,0.07421333260006376
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,51200,8192,0.14102666907840306
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,51200,5120,0.08915644221835667
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,51200,7168,0.1271457804573907
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,51200,5120,0.06381422281265259
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,51200,6144,0.1124311155743069
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,51200,4096,0.07355911201900907
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,51200,3584,0.06354577673806085
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,51200,16384,0.25792000028822154
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,51200,4096,0.05411110983954536
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,51200,3072,0.0557733310593499
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,51200,3584,0.04917866653866238
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,51200,5120,0.09874488910039265
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,51200,4096,0.08526221911112468
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,51200,2560,0.04745777779155307
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,51200,3584,0.07924444145626493
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,51200,3072,0.04412710997793409
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,51200,2560,0.03975111246109009
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,51200,2048,0.03904533386230469
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,51200,3072,0.07253333595063952
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,51200,51200,0.8790586789449056
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,51200,1536,0.030385779009924993
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,51200,1024,0.023362666368484497
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,51200,2048,0.03578666514820523
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,51200,2560,0.06511111391915216
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,51200,768,0.01759111053413815
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,51200,2048,0.0584462218814426
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,51200,1024,0.024859555893474158
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,51200,1024,0.043972445858849414
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,51200,512,0.012082666986518435
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,51200,768,0.020764445265134174
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,51200,768,0.041286223464541964
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,51200,256,0.008934222161769867
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,51200,1536,0.030192000998391047
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,51200,512,0.0188746667570538
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,51200,1536,0.05146222313245138
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,51200,128,0.006278222219811545
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,51200,256,0.03269511130121019
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,51200,64,0.005602666487296422
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,51200,256,0.017450667089886136
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,51200,51200,0.7862657970852323
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,51200,128,0.02657866643534766
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,51200,128,0.01650399963061015
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,51200,32,0.01853155593077342
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,16384,65536,0.32700710826449925
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,16384,65536,0.28393512301974827
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,16384,51200,0.25246577792697483
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,16384,51200,0.22087821695539686
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,51200,65536,1.048359129163954
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,16384,16384,0.0871395534939236
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,51200,512,0.03793333305252923
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,51200,32,0.006301333506902059
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,16384,12288,0.0661075578795539
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,16384,16384,0.08925422032674153
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,16384,10240,0.056332442495557994
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,51200,64,0.016152888536453247
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,16384,12288,0.06242044766743978
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,16384,8192,0.04643199841181437
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,16384,10240,0.05598844422234429
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,16384,16384,0.0915528866979811
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,16384,7168,0.04048177931043837
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,16384,12288,0.07385155227449205
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,16384,8192,0.04534222351180183
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,16384,10240,0.06593955225414701
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,16384,6144,0.035608000225490995
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,16384,7168,0.04027377896838718
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,16384,8192,0.059162669711642794
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,16384,5120,0.030928889910380047
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,16384,6144,0.03631022241380479
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,16384,7168,0.05282577872276306
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,16384,4096,0.026068444053332012
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,16384,6144,0.04822133315934075
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,16384,5120,0.03239999877081977
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,16384,3584,0.022991110881169636
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,16384,65536,0.2872133255004883
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,16384,5120,0.04384711053636339
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,16384,4096,0.028466665082507666
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,16384,4096,0.03939911060863071
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,16384,3072,0.02054933375782437
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,16384,2560,0.01759199963675605
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,16384,3584,0.02552000019285414
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,16384,3072,0.0239955551094479
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,16384,2048,0.01423111061255137
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,16384,2560,0.02144977781507704
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,16384,51200,0.22619199752807617
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,16384,1536,0.011759999725553723
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,16384,2048,0.0325617790222168
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,16384,2048,0.019896000623703003
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,16384,3072,0.0358533329433865
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,16384,1024,0.009008888569143083
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,16384,768,0.007939555578761632
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,16384,1536,0.030079109801186457
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,16384,1536,0.017999110950364005
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,16384,1024,0.029020445214377508
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,16384,512,0.006231110956933763
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,16384,1024,0.01623911162217458
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,16384,768,0.025935111774338618
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,16384,256,0.0041786668201287585
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,16384,512,0.02403822210099962
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,16384,512,0.014132445057233175
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,16384,128,0.0038319999972979226
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,16384,256,0.022500443789694045
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,16384,256,0.013090666797426013
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,16384,64,0.003677333394686381
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,16384,32,0.0038559999730851916
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,16384,128,0.019539554913838703
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,16384,128,0.01312711089849472
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,16384,64,0.012444444828563266
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,16384,32,0.013419555293189155
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,12288,65536,0.2451253202226427
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,12288,65536,0.23096622361077201
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,12288,51200,0.1861928833855523
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,16384,3584,0.03826311230659485
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,12288,16384,0.06383199824227227
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,16384,2560,0.033927109506395124
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,12288,51200,0.17962400118509927
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,12288,12288,0.05110488997565376
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,12288,16384,0.06606133116616143
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,12288,10240,0.04240977764129639
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,16384,768,0.01514755520555708
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,12288,12288,0.052766223748524986
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,12288,8192,0.035736001200146146
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,12288,12288,0.06764533122380574
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,12288,16384,0.08130755689409044
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,12288,7168,0.031082666582531396
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,12288,8192,0.03856177793608771
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,12288,10240,0.0610026650958591
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,12288,7168,0.034633778863483004
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,12288,8192,0.05310488740603129
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,12288,6144,0.02737155556678772
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,12288,5120,0.023753777146339417
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,12288,7168,0.048560000128216214
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,12288,6144,0.031552000178231135
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,12288,6144,0.044729779163996376
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,12288,4096,0.02106844385464986
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,12288,5120,0.027983999914593164
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,12288,51200,0.203019552760654
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,12288,3584,0.017839999662505258
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,12288,5120,0.04079733292261759
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,12288,3072,0.015481778317027621
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,12288,4096,0.03743733300103082
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,12288,3584,0.02309333284695943
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,12288,3584,0.036151111125946045
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,12288,2560,0.013086222112178802
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,12288,3072,0.020624000165197585
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,12288,2560,0.01964000033007728
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,12288,2560,0.0329093337059021
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,12288,2048,0.011689778003427716
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,12288,10240,0.0465848876370324
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,12288,1536,0.009637333452701569
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,12288,2048,0.018407111366589863
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,12288,1024,0.008270222279760573
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,12288,1536,0.029176887538697984
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,12288,1536,0.01685422162214915
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,12288,768,0.007151111132568783
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,12288,1024,0.014882667197121514
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,12288,1024,0.025777777036031086
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,12288,512,0.004968889057636261
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,12288,768,0.013818666338920593
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,12288,768,0.0247999992635515
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,12288,256,0.0041955556306574075
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,12288,512,0.013068444199032254
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,12288,512,0.024689777029885188
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,12288,65536,0.2538631227281359
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,12288,128,0.003983111017280155
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,12288,4096,0.0240346673462126
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,12288,256,0.0127368892232577
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,12288,256,0.021640888518757288
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,12288,64,0.003768889026509391
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,12288,128,0.020928000410397846
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,12288,32,0.0038408889538711975
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,12288,128,0.0123848890264829
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,12288,64,0.012080888781282636
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,12288,3072,0.03473155697186788
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,12288,32,0.012503999802801343
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,10240,65536,0.2022648917304145
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,10240,51200,0.1578142245610555
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,10240,65536,0.2211271127065023
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,10240,16384,0.05368266503016154
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,10240,51200,0.1744684378306071
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,12288,2048,0.03159911102718777
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,10240,12288,0.043078223864237465
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,10240,10240,0.035931554105546736
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,10240,16384,0.06391200092103747
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,10240,12288,0.05135022269354927
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,10240,8192,0.03093155556254917
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,10240,12288,0.0661768913269043
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,10240,10240,0.0591191119617886
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,10240,8192,0.03747377792994181
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,10240,7168,0.026527111728986103
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,10240,8192,0.051580445633994214
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,10240,6144,0.02331466641690996
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,10240,7168,0.03344710999064975
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,10240,7168,0.04738222228156196
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,10240,51200,0.1958533393012153
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,10240,5120,0.020228443874253165
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,10240,6144,0.030461334519916113
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,10240,4096,0.01754044493039449
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,10240,65536,0.2436906761593289
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,10240,6144,0.04411910971005758
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,10240,5120,0.03974044322967529
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,10240,5120,0.02595111065440708
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,10240,3584,0.014914666612943014
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,10240,3072,0.013385777672131857
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,10240,4096,0.02336888843112522
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,10240,4096,0.03708444370163812
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,10240,3584,0.035720000664393105
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,10240,3072,0.02069422271516588
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,10240,3072,0.03422666589419047
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,10240,2048,0.010026666853162978
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,10240,2560,0.019310222731696237
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,10240,2560,0.03229866756333245
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,10240,1536,0.008601778083377415
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,10240,16384,0.07897422048780653
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,10240,2048,0.018183110488785636
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,10240,2048,0.03029777937465244
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,10240,10240,0.045400000280804105
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,10240,1536,0.016511110795868766
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,10240,1536,0.028943998946083918
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,10240,768,0.006005333529578314
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,10240,1024,0.025137777129809063
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,10240,1024,0.014113777213626437
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,10240,512,0.0042462220622433555
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,10240,768,0.024680000212457445
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,10240,256,0.0038897775941424896
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,10240,512,0.013068444199032254
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,10240,512,0.024716445141368445
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,10240,128,0.003569777641031477
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,10240,256,0.022335110439194575
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,10240,128,0.01240533341964086
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,10240,64,0.0035048888789282907
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,10240,128,0.01956533392270406
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,10240,32,0.003551111039188173
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,10240,64,0.013003555436929068
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,10240,2560,0.011367999845080905
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,10240,32,0.012666666673289405
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,8192,65536,0.18843021657731798
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,8192,65536,0.17944622039794922
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,10240,1024,0.0070053330726093715
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,8192,51200,0.14555999967787
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,8192,16384,0.04488889045185513
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,8192,51200,0.1418186691072252
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,10240,768,0.013419555293189155
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,8192,16384,0.05339822173118591
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,8192,12288,0.03580977850490146
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,10240,256,0.012508444488048553
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,8192,16384,0.07380088832643297
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,8192,10240,0.029725333054860432
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,8192,12288,0.043218665652804904
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,8192,65536,0.2264853318532308
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,8192,12288,0.06236355834537082
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,10240,3584,0.021888888544506494
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,8192,51200,0.18172800540924072
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,8192,10240,0.038239111502965294
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,8192,7168,0.022318222456508215
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,8192,10240,0.05654311180114746
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,8192,8192,0.031918221049838595
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,8192,6144,0.019807111885812547
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,8192,8192,0.04905066556400723
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,8192,7168,0.027748444014125403
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,8192,5120,0.017027555240525138
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,8192,7168,0.04605688982539707
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,8192,6144,0.025425778494940862
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,8192,6144,0.04231199953291151
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,8192,5120,0.022653333014912073
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,8192,5120,0.038966221941841975
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,8192,3584,0.012698666916953193
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,8192,4096,0.03636888994110955
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,8192,3072,0.011863110793961419
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,8192,3584,0.035008000002966985
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,8192,3584,0.019495111372735765
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,8192,2560,0.010440888504187265
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,8192,3072,0.018539556198649935
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,8192,3072,0.03358133302794562
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,8192,2048,0.00902133352226681
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,8192,2560,0.01735466718673706
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,8192,1536,0.007963555554548899
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,8192,2560,0.032215111785464816
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,8192,2048,0.01680888897842831
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,8192,2048,0.030415111117892798
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,8192,1024,0.006631999793979857
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,8192,1536,0.02865155537923177
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,8192,1536,0.014552889598740472
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,8192,768,0.0052471111218134565
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,8192,1024,0.01353422221210268
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,8192,1024,0.02529511186811659
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,8192,512,0.004468444320890638
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,8192,768,0.013082666529549493
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,8192,256,0.0038604442444112566
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,8192,512,0.012601777911186218
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,8192,512,0.024155555499924555
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,8192,128,0.003569777641031477
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,8192,256,0.02158044444190131
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,8192,256,0.01204622205760744
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,8192,4096,0.0144195556640625
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,8192,64,0.0035111109415690103
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,8192,128,0.0122417774465349
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,8192,32,0.0036391110883818734
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,8192,128,0.018901333212852478
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,8192,4096,0.020849777592553034
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,8192,64,0.012368888490729861
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,8192,32,0.012432888978057437
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,7168,65536,0.16179111268785265
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,7168,51200,0.1291617817348904
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,7168,65536,0.17332622740003797
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,7168,16384,0.04542577928966946
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,7168,51200,0.13856977886623806
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,7168,12288,0.03560355636808608
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,7168,16384,0.05232266585032145
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,7168,16384,0.07284088929494222
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,7168,12288,0.04196977615356445
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,7168,10240,0.030086222622129653
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,8192,8192,0.02546399997340308
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,7168,12288,0.06137510803010729
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,7168,8192,0.025448888540267944
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,8192,768,0.025382222400771245
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,7168,10240,0.0366248885790507
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,7168,7168,0.022312000393867493
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,7168,8192,0.03068000078201294
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,7168,10240,0.056052446365356445
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,7168,51200,0.17933155430687797
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,7168,6144,0.01959288948112064
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,7168,8192,0.048031111558278404
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,7168,5120,0.016904888881577384
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,7168,7168,0.027016000615225896
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,7168,7168,0.04636266827583313
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,7168,4096,0.014764444695578681
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,7168,6144,0.02496533261405097
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,7168,6144,0.04197600152757433
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,7168,5120,0.02255022194650438
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,7168,3584,0.012132444315486483
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,7168,5120,0.038951999611324735
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,7168,3072,0.0110880004035102
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,7168,4096,0.02089333368672265
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,7168,4096,0.03645777702331543
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,7168,2560,0.009890666438473595
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,7168,3584,0.0347671111424764
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,7168,3584,0.019535111056433786
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,7168,3072,0.018242667118708294
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,7168,2048,0.0086666668454806
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,7168,3072,0.03382577829890781
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,7168,1536,0.007589333587222629
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,7168,2560,0.017501332693629794
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,7168,2560,0.031621333625581526
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,7168,1024,0.005675555517276128
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,7168,2048,0.028378665447235107
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,7168,2048,0.01573244399494595
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,7168,768,0.004878222114510006
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,7168,1536,0.0281315545241038
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,7168,1024,0.013693333499961428
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,7168,1024,0.024671110841963027
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,7168,512,0.004242666479614046
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,7168,768,0.025404444999165002
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,7168,256,0.003963555726740095
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,7168,512,0.012512000070677863
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,7168,512,0.025056888659795124
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,7168,128,0.00351555562681622
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,7168,256,0.01240533341964086
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,7168,256,0.021336000826623704
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,7168,64,0.0032764443506797156
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,7168,32,0.003567111161020067
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,7168,128,0.018915555543369718
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,7168,128,0.012081777883900536
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,7168,64,0.011709333293967776
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,7168,32,0.012460444536474017
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,6144,65536,0.1463866631189982
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,6144,65536,0.17037067148420545
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,6144,51200,0.11635288927290176
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,6144,16384,0.036144001616372004
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,6144,51200,0.133440891901652
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,6144,16384,0.051009777519438
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,6144,12288,0.029249777396519978
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,7168,1536,0.014780445231331719
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,6144,16384,0.07213511069615682
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,6144,10240,0.02427022159099579
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,6144,12288,0.04057244459788004
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,7168,768,0.01290844463639789
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,6144,65536,0.22194488843282065
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,6144,8192,0.02142222225666046
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,6144,12288,0.06175733274883694
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,6144,51200,0.17801333798302543
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,6144,10240,0.03478399912516276
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,6144,7168,0.0181048893266254
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,6144,6144,0.01590044465329912
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,6144,10240,0.05517333414819506
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,6144,8192,0.030016889174779255
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,6144,8192,0.047835555341508657
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,6144,7168,0.026362667481104534
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,6144,7168,0.04490310947100321
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,6144,5120,0.013829333086808523
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,6144,4096,0.012135110795497894
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,6144,6144,0.024381332927280005
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,6144,6144,0.04188977678616842
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,6144,3584,0.011021333436171213
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,6144,5120,0.03872444563441806
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,6144,5120,0.022288888692855835
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,7168,65536,0.22371199395921496
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,6144,4096,0.020282665888468426
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,6144,3072,0.009914666414260864
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,6144,2560,0.008943110704421997
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,6144,3584,0.019307555423842538
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,6144,2048,0.007843555675612556
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,6144,3072,0.03291644321547614
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,6144,2560,0.016904888881577384
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,6144,2560,0.03158222304450141
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,6144,1536,0.0069439998931354946
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,6144,2048,0.015394666128688388
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,6144,2048,0.028813332319259644
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,6144,1024,0.005121777868933148
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,6144,1536,0.026337777574857075
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,6144,1536,0.014259555273585849
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,6144,768,0.004504000147183736
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,6144,1024,0.025408888856569927
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,6144,1024,0.013207111093733044
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,6144,512,0.0041911109454101985
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,6144,768,0.012801777985360889
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,6144,768,0.02570488883389367
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,6144,256,0.003549333247873518
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,6144,512,0.024383111132515803
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,6144,512,0.012381333443853589
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,6144,128,0.003264888914095031
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,6144,256,0.012415111064910889
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,6144,256,0.021948445174429152
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,6144,64,0.0032275555034478507
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,6144,32,0.0032008888406885993
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,6144,128,0.019903111788961623
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,6144,64,0.011710222396585675
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,6144,32,0.012424888710180918
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,5120,65536,0.11940799819098578
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,5120,51200,0.09683110978868271
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,6144,4096,0.03563288847605387
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,5120,65536,0.16416800022125244
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,6144,3584,0.03468799922201369
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,5120,16384,0.03944889042112563
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,5120,16384,0.050048887729644775
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,5120,51200,0.12818311320410833
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,5120,12288,0.031172444423039753
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,5120,16384,0.07248000303904216
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,5120,12288,0.0388408899307251
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,5120,10240,0.02222488820552826
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,5120,12288,0.06105066670311821
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,5120,65536,0.2190986606809828
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,5120,51200,0.17511733373006186
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,5120,8192,0.018956444329685636
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,5120,10240,0.033430222007963396
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,5120,10240,0.054582221640480884
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,5120,7168,0.016452444924248587
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,5120,8192,0.02840977907180786
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,5120,8192,0.047825776868396334
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,5120,6144,0.014422222971916199
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,6144,128,0.011758222348160215
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,5120,7168,0.026076444321208533
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,5120,7168,0.04504444532924228
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,5120,5120,0.013369777964221107
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,5120,4096,0.011438222395049201
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,5120,6144,0.02379111117786831
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,5120,5120,0.038895110289255776
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,5120,5120,0.021947556071811255
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,5120,3584,0.010026666853162978
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,5120,4096,0.020188444190555148
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,5120,3072,0.009307555854320526
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,5120,3584,0.03472355670399136
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,5120,3584,0.018816888332366943
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,5120,2560,0.008289777570300633
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,6144,3072,0.01796533332930671
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,5120,3072,0.03319733341534933
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,5120,2048,0.007419555551475949
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,5120,2560,0.015543111496501498
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,5120,2048,0.01514311134815216
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,5120,2048,0.027416000763575237
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,5120,1536,0.006229333165619109
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,5120,1536,0.026699556244744196
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,5120,1536,0.014083556003040738
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,5120,1024,0.0047644442982143825
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,5120,1024,0.025714667307005987
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,5120,768,0.004234666625658671
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,5120,6144,0.04120444589191013
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,5120,768,0.013064888616402945
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,5120,512,0.0041911109454101985
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,5120,768,0.0233324451578988
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,5120,256,0.0038328886859946777
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,5120,4096,0.03533600105179681
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,5120,512,0.023294222023752
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,5120,512,0.012735111018021902
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,5120,128,0.0031831111345026228
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,5120,256,0.01203555530971951
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,5120,256,0.022668444448047217
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,5120,64,0.0032133333798911837
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,5120,128,0.019280888968043856
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,5120,3072,0.01754844519827101
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,5120,32,0.0032195556494924757
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,5120,2560,0.031228442986806233
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,5120,64,0.01204355557759603
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,4096,65536,0.09715288877487183
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,4096,51200,0.07840710878372192
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,4096,65536,0.1232302188873291
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,4096,16384,0.03185155656602647
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,4096,51200,0.09927022457122803
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,4096,16384,0.03776266508632236
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,4096,12288,0.02553155521551768
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,5120,1024,0.01313688854376475
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,4096,16384,0.07204888926612006
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,4096,10240,0.018937778141763475
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,4096,65536,0.21816621886359322
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,4096,51200,0.17439556121826172
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,4096,12288,0.0602017773522271
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,4096,8192,0.01661777827474806
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,4096,10240,0.02713955607679155
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,4096,10240,0.054216000768873424
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,4096,7168,0.01441422270403968
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,4096,8192,0.04715377754635281
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,4096,8192,0.023473777704768713
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,4096,6144,0.012988444831636218
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,4096,7168,0.021038222644064162
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,4096,7168,0.04452444447411431
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,5120,128,0.012064889073371887
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,4096,6144,0.020243555307388306
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,4096,6144,0.04053599966896905
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,4096,4096,0.01054222219520145
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,4096,5120,0.018908444378111098
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,4096,5120,0.037913779417673744
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,4096,3584,0.009339555270142024
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,4096,4096,0.01739022301303016
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,4096,4096,0.03497066762712266
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,4096,3072,0.008279110822412703
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,4096,3584,0.01649688846535153
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,4096,3584,0.033831109603246055
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,4096,2560,0.0075795559419526
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,4096,3072,0.015056000815497505
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,4096,3072,0.03257333238919576
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,4096,2048,0.006937777830494775
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,4096,2560,0.014779556128713818
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,4096,2560,0.029743111795849268
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,4096,1536,0.005374222166008419
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,4096,2048,0.013526221944226159
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,4096,2048,0.026777777406904433
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,4096,1024,0.00453333349691497
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,4096,1536,0.013459555804729462
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,4096,1536,0.026288888520664636
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,4096,768,0.0038408889538711975
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,4096,12288,0.02975377771589491
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,4096,1024,0.012460444536474017
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,4096,512,0.0035582222044467926
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,4096,768,0.025034666061401367
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,4096,768,0.012433778080675336
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,4096,256,0.00350222239891688
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,4096,512,0.012071111136012606
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,4096,512,0.024323556158277724
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,4096,128,0.00351555562681622
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,4096,256,0.011704888608720569
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,4096,256,0.021606221795082092
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,4096,5120,0.0116462219092581
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,4096,64,0.0032106666929192017
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,4096,32,0.003169777699642711
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,5120,32,0.011757333245542316
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,4096,64,0.011377777490350934
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,4096,32,0.011502222054534487
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,3584,65536,0.08362933662202622
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,3584,51200,0.06850488980611165
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,3584,65536,0.12141333685980903
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,3584,51200,0.09501866499582927
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,3584,16384,0.029594666428036157
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,4096,1024,0.025070221887694463
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,3584,65536,0.21665333376990425
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,3584,16384,0.035989334185918175
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,3584,51200,0.17455377843644884
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,3584,16384,0.0710773335562812
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,3584,10240,0.02187999917401208
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,3584,12288,0.029159112109078303
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,3584,12288,0.059756444560156934
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,3584,8192,0.015309333801269531
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,3584,10240,0.05385155479113261
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,4096,128,0.01956355571746826
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,3584,7168,0.013783111340469785
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,3584,8192,0.02286400066481696
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,3584,6144,0.012304888831244575
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,3584,7168,0.021359999974568684
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,3584,7168,0.043551110559039645
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,3584,5120,0.010672888822025724
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,3584,6144,0.01977599991692437
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,3584,6144,0.040617777241600886
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,3584,4096,0.009782222410043081
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,3584,5120,0.018194667167133756
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,3584,5120,0.03737066520584954
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,3584,3584,0.008966222405433655
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,3584,4096,0.016885333591037326
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,3584,4096,0.03491466575198703
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,3584,3072,0.008278222547637092
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,3584,3584,0.034104890293545194
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,3584,3072,0.01479466590616438
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,3584,12288,0.024554666545655992
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,3584,2560,0.007300444775157505
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,3584,3072,0.030489779180950586
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,3584,2048,0.006234666539563074
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,3584,2560,0.028772443532943726
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,3584,2560,0.014031110538376702
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,3584,1536,0.004920888692140579
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,3584,2048,0.013421333498424955
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,3584,2048,0.02712000078625149
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,3584,10240,0.02660977840423584
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,4096,128,0.011758222348160215
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,3584,1024,0.00424799985355801
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,3584,768,0.0038773334688610504
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,3584,1536,0.013085333009560903
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,3584,1024,0.025359110699759588
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,3584,8192,0.04704977737532722
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,3584,512,0.0035235554807715942
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,3584,768,0.012298666768603854
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,3584,768,0.02330933345688714
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,3584,256,0.003549333247873518
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,3584,512,0.024382222029897902
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,3584,512,0.012450666891203986
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,3584,128,0.003335111050142182
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,3584,256,0.011701333026091257
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,3584,256,0.020977778567208186
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,3584,64,0.0031600000543726813
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,3584,32,0.00314666661951277
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,3584,128,0.0196142229768965
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,3584,64,0.011401777466138205
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,3072,65536,0.07589333587222628
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,3584,32,0.011408888631396823
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,3584,3584,0.015644444359673392
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,3072,51200,0.06223377916547987
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,3072,65536,0.11807110574510361
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,3072,16384,0.025366221865018208
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,3072,51200,0.09401955869462754
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,3072,16384,0.03493155704604255
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,3072,16384,0.07081511285569933
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,3072,12288,0.02194044490655263
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,3072,65536,0.2166435586081611
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,3584,1536,0.026092444856961567
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,3072,10240,0.0177831103404363
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,3584,1024,0.012728888955381183
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,3072,12288,0.0591377748383416
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,3072,8192,0.016186666157510545
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,3072,10240,0.026439110438028973
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,3072,10240,0.053957333167394005
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,3072,7168,0.013786666923099093
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,3072,8192,0.022042666872342426
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,3072,8192,0.04686399963166979
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,3072,6144,0.011747555600272285
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,3072,7168,0.02082577844460805
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,3072,7168,0.043839110268486865
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,3584,128,0.011742221812407175
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,3072,5120,0.010978666444619497
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,3072,6144,0.040411555104785495
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,3072,6144,0.01958577831586202
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,3072,4096,0.009418666362762451
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,3072,5120,0.0377768874168396
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,3072,5120,0.018271999226676095
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,3072,3584,0.008678221868144141
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,3072,4096,0.034448888566758894
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,3072,4096,0.015796444482273526
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,3072,3072,0.007963555554548899
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,3072,3584,0.031606223848130964
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,3072,3584,0.015152000718646579
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,3072,3072,0.014473777678277759
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,3072,2560,0.007489778101444244
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,3072,3072,0.03035199973318312
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,3072,2048,0.006280888699822956
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,3072,2560,0.029143999020258587
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,3072,2048,0.026437333888477747
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,3072,2048,0.013455111119482251
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,3072,1536,0.00526311124364535
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,3072,1024,0.00453955555955569
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,3072,51200,0.17390133274926078
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,3072,1536,0.02532888948917389
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,3072,1536,0.013070222404268054
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,3072,768,0.004168888760937585
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,3072,1024,0.012471111284361945
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,3072,512,0.0038728887836138406
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,3072,1024,0.02331466641690996
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,3072,768,0.02370400064521366
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,3072,768,0.01239999963177575
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,3072,256,0.0034755555291970572
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,3072,128,0.0032088889016045462
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,3072,512,0.022649778260125056
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,3072,256,0.011703111231327057
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,3072,64,0.0031804444475306403
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,3072,128,0.01889244384235806
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,3072,128,0.011402666568756104
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,3072,32,0.0032524443748924467
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,3072,64,0.011433777709801992
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,2560,65536,0.06326755550172594
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,3072,32,0.011023110813564725
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,2560,51200,0.05260089039802551
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,2560,65536,0.11637332704332139
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,2560,51200,0.09069599707921346
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,3072,2560,0.014184888866212634
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,2560,16384,0.022944889134830896
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,2560,65536,0.2152871158387926
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,2560,12288,0.019101333287027147
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,2560,16384,0.03381333417362637
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,3072,12288,0.02847911251915826
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,2560,51200,0.17367733849419487
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,2560,10240,0.017166222135225933
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,2560,12288,0.059506667984856494
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,3072,512,0.012182222472296821
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,2560,10240,0.02572533322705163
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,2560,10240,0.05345066719584995
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,3072,256,0.021963554951879714
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,2560,7168,0.014076444837782117
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,2560,8192,0.046345776981777616
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,2560,8192,0.022146667043368023
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,2560,6144,0.012822222378518848
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,2560,7168,0.04340177774429321
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,2560,7168,0.020523554748959012
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,2560,5120,0.010337777435779572
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,2560,6144,0.01920977731545766
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,2560,6144,0.04014488723542955
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,2560,4096,0.00924622184700436
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,2560,5120,0.03647111190689935
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,2560,5120,0.01756355497572157
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,2560,3584,0.008271999657154083
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,2560,4096,0.01608444419172075
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,2560,4096,0.033019555939568415
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,2560,3072,0.007584888901975419
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,2560,3584,0.014775110615624322
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,2560,3584,0.03185688787036472
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,2560,2560,0.006779555645253923
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,2560,3072,0.030135111676322088
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,2560,3072,0.014440000057220459
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,2560,2048,0.005625777774386936
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,2560,2560,0.013804444836245643
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,2560,2560,0.028668443361918133
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,2560,16384,0.07016088565190633
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,2560,2048,0.013463111387358772
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,2560,2048,0.02631644407908122
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,2560,1024,0.004508444418509801
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,2560,1536,0.012792000340090858
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,2560,1536,0.025377778543366328
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,2560,768,0.0041955556306574075
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,2560,12288,0.028055999014112685
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,2560,1024,0.0123848890264829
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,2560,1024,0.024333332975705464
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,2560,512,0.0038559999730851916
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,2560,8192,0.015013333823945789
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,2560,256,0.0031644445326593188
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,2560,768,0.012085333466529846
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,2560,128,0.002867555452717675
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,2560,512,0.02370311154259576
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,2560,512,0.012039110892348819
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,2560,256,0.012078222301271228
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,2560,256,0.02159999973244137
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,2560,64,0.0028986665937635633
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,2560,128,0.019557333654827543
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,2560,128,0.011413333316644033
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,2560,32,0.0031617778456873367
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,2048,65536,0.05348711212476095
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,2560,64,0.011416888899273343
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,2560,32,0.011693333586057028
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,2048,51200,0.04400622182422214
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,2048,65536,0.11303644710116917
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,2048,16384,0.019174221489164565
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,2048,51200,0.09001777569452922
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,2048,16384,0.033048888047536217
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,2048,65536,0.21470044718848336
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,2048,16384,0.07021866904364692
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,2048,12288,0.015472888946533203
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,2048,10240,0.014456000592973499
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,2560,1536,0.0052151112920708126
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,2048,12288,0.059021333853403725
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,2048,8192,0.014094221923086377
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,2048,10240,0.025432889660199482
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,2560,768,0.0236435549126731
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,2048,8192,0.04658755660057068
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,2048,7168,0.012703999876976013
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,2048,7168,0.02010311186313629
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,2048,7168,0.04342844420009189
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,2048,6144,0.011666666302416058
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,2048,6144,0.018253333038753934
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,2048,6144,0.04023199942376878
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,2048,5120,0.010323555933104621
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,2048,5120,0.017436444759368896
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,2048,4096,0.008661333057615492
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,2048,51200,0.1728817754321628
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,2048,4096,0.015881778465376962
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,2048,3584,0.008263111114501953
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,2048,4096,0.032650666104422674
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,2048,12288,0.027592000034120347
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,2048,3072,0.007263999846246507
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,2048,3584,0.014918223023414612
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,2048,3584,0.031508445739746094
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,2048,2560,0.006587555425034628
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,2048,8192,0.021593777669800654
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,2048,3072,0.030415998564826116
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,2048,2048,0.005583999885453119
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,2048,2560,0.02836444311671787
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,2048,2560,0.014103111293580798
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,2048,1536,0.004568888909286923
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,2048,2048,0.013411555853154926
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,2048,2048,0.027466666367318895
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,2048,1024,0.0041697778635554844
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,2048,1536,0.013096888860066732
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,2048,1536,0.02606044378545549
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,2048,768,0.0038417776425679526
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,2048,1024,0.012712889247470431
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,2048,1024,0.02470933397610982
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,2048,512,0.003524444583389494
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,2048,768,0.024000888069470722
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,2048,768,0.012060444388124677
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,2048,256,0.003160888950030009
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,2048,512,0.012096000214417776
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,2048,512,0.024282667371961806
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,2048,128,0.003133333391613431
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,2048,256,0.011697777443461947
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,2048,64,0.0028355556229750314
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,2048,128,0.01926399932967292
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,2048,128,0.011791999969217511
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,2048,32,0.0028373334142896864
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,1536,65536,0.04333600070741442
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,2048,64,0.011134222149848938
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,2048,32,0.011758222348160215
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,2048,10240,0.05317066775427925
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,1536,65536,0.10968889130486383
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,2048,3072,0.014119999276267158
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,1536,16384,0.014896889527638754
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,1536,65536,0.2150648832321167
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,1536,16384,0.03221333358022902
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,1536,16384,0.06993155346976386
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,1536,12288,0.014293332894643148
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,1536,12288,0.05858577622307671
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,1536,12288,0.02740977704524994
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,1536,10240,0.012728888955381183
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,2048,5120,0.035535110367669
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,1536,8192,0.01129333343770769
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,2048,256,0.02234755622016059
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,1536,10240,0.02496444516711765
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,1536,10240,0.0530426667796241
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,1536,7168,0.010991999672518836
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,1536,8192,0.0209840006298489
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,1536,8192,0.046332445409562856
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,1536,6144,0.01036977767944336
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,1536,7168,0.01907999979125129
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,1536,7168,0.04131822122467889
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,1536,5120,0.009600888523790572
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,1536,51200,0.03493422269821167
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,1536,6144,0.017856889300876193
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,1536,4096,0.008647110727098253
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,1536,5120,0.035982221364974976
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,1536,3584,0.00741244438621733
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,1536,4096,0.015228443675571017
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,1536,4096,0.032590223683251276
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,1536,51200,0.08807822068532307
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,1536,3072,0.006665777828958299
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,1536,3584,0.014448000325096978
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,1536,3584,0.03192799952295091
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,1536,2560,0.005976888868543837
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,1536,51200,0.17316088411543104
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,1536,3072,0.03011022342575921
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,1536,3072,0.014383999837769402
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,1536,2048,0.005365333209435145
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,1536,2560,0.014111111561457316
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,1536,2560,0.02878755662176344
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,1536,2048,0.026710222164789837
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,1536,2048,0.013418667018413544
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,1536,1024,0.004280888785918553
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,1536,1536,0.013079110946920184
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,1536,1536,0.025384889708624944
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,1536,768,0.0038417776425679526
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,1536,1024,0.01240355521440506
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,1536,1024,0.024448888169394598
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,1536,512,0.003488000068399641
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,1536,768,0.01202755586968528
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,1536,768,0.02392622166209751
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,1536,256,0.0032151111712058387
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,1536,512,0.01205599970287747
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,1536,512,0.023344000180562336
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,1536,6144,0.03824266791343689
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,1536,128,0.0032115555885765287
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,1536,5120,0.016499555773205228
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,1536,256,0.011720889144473605
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,1536,64,0.002936888900068071
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,1536,256,0.022280888424979314
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,1536,32,0.00281866660548581
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,1536,128,0.018577777677112155
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,1536,128,0.011362666885058085
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,1024,65536,0.03164800008138021
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,1536,64,0.011362666885058085
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,1024,51200,0.02534666657447815
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,1536,32,0.011078221930397881
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,1024,16384,0.012724444270133972
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,1024,65536,0.10653422276178996
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,1024,51200,0.08494044674767388
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,1024,12288,0.013807111316257052
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,1024,16384,0.032186667124430336
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,1024,16384,0.06980711221694946
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,1024,65536,0.21538310580783418
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,1024,51200,0.17379644181993273
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,1024,10240,0.012627555264366997
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,1024,8192,0.010947555303573608
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,1024,12288,0.026735999517970618
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,1536,1536,0.004893333133724001
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,1024,12288,0.05795644389258491
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,1024,7168,0.010388444695207808
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,1024,10240,0.05184444453981188
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,1024,10240,0.023717333873112995
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,1024,6144,0.00963466697269016
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,1024,8192,0.01994755533006456
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,1024,5120,0.00885511106914944
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,1024,8192,0.045180443260404796
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,1024,7168,0.04191022117932638
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,1024,7168,0.018920888503392536
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,1024,6144,0.0373564428753323
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,1024,6144,0.01755911111831665
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,1024,5120,0.03496444556448195
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,1024,3584,0.007179555793603261
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,1024,5120,0.016531555189026725
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,1024,3072,0.006540444576077991
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,1024,4096,0.03259377678235372
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,1024,4096,0.014820444915029736
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,1024,2560,0.00591555568906996
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,1024,3584,0.01442311041884952
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,1024,3584,0.03109333250257704
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,1024,2048,0.005202666752868229
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,1024,3072,0.014096000128322177
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,1024,3072,0.030256887276967365
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,1024,1536,0.004592888885074192
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,1024,2560,0.0288080010149214
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,1024,1024,0.003921777837806278
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,1024,2048,0.02677333354949951
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,1024,1536,0.012740444805887012
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,1024,768,0.0035457776652442086
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,1024,1024,0.024326221810446844
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,1024,768,0.012175111307038201
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,1024,768,0.0236835562520557
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,1024,512,0.0034088889757792154
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,1024,512,0.023473777704768713
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,1024,512,0.011768889096048145
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,1024,256,0.003149333306484752
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,1024,256,0.011704888608720569
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,1024,128,0.0028782222006056043
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,1024,4096,0.007958222594526079
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,1024,128,0.011369778050316704
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,1024,128,0.018583110637134977
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,1024,64,0.0028737777223189673
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,1024,32,0.0025804444319672054
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,1024,64,0.01126933346192042
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,1024,2560,0.013716444373130798
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,1024,32,0.011012444065676795
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,768,65536,0.027497778336207073
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,1024,2048,0.013094222380055321
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,768,51200,0.02291999922858344
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,1024,1536,0.025980444418059453
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,1024,1024,0.012440000143316058
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,768,65536,0.10418933629989624
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,768,16384,0.013426666458447775
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,768,51200,0.08311111397213407
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,768,65536,0.21528800328572592
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,768,12288,0.011961778004964193
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,768,10240,0.011339555184046427
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,768,16384,0.03186310993300544
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,768,16384,0.07013689147101508
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,768,8192,0.009686222506894005
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,768,12288,0.05727466609742907
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,768,12288,0.024967110819286768
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,768,10240,0.02268444498380025
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,768,7168,0.009171555439631144
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,768,10240,0.05085777905252245
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,768,6144,0.008635555704434713
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,768,8192,0.044215109613206655
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,768,8192,0.01998666591114468
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,1024,256,0.022410665949185688
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,768,7168,0.0410151117377811
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,768,7168,0.019089778264363606
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,768,6144,0.017530666457282174
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,768,6144,0.037704888317320086
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,768,4096,0.007978666987684038
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,768,3584,0.007345777418878343
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,768,5120,0.03467466764979892
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,768,5120,0.016488000750541687
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,768,3072,0.006583999842405319
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,768,4096,0.032518221272362605
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,768,4096,0.014811555544535318
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,768,3584,0.03087466624048021
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,768,2560,0.0058959999846087555
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,768,3584,0.014420444766680399
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,768,2048,0.005222222043408289
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,768,3072,0.014113777213626437
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,768,3072,0.030187557140986126
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,768,1536,0.004575110971927643
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,768,2560,0.028079112370808918
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,768,2560,0.013468444347381592
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,768,2048,0.027060444156328838
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,768,1024,0.0038355555799272326
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,768,2048,0.013268444273206921
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,768,768,0.003626666549179289
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,768,1536,0.025747555825445387
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,768,1536,0.013063111239009433
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,768,512,0.003173333282272021
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,768,1024,0.02437155610985226
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,768,1024,0.01237777786122428
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,768,768,0.012060444388124677
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,768,768,0.02309866746266683
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,768,512,0.023250665929582384
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,768,512,0.012040889097584618
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,768,128,0.0028071111689011254
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,768,256,0.02126755482620663
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,768,256,0.011502222054534487
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,768,64,0.0028231110837724474
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,768,32,0.0025271111064487034
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,768,128,0.018858666221300762
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,768,128,0.011713777979214987
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,512,65536,0.02093688812520769
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,768,64,0.0110871113008923
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,512,51200,0.016799110505315993
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,768,32,0.011018666956159802
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,768,5120,0.00796977761718962
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,512,16384,0.011166222393512726
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,512,65536,0.10361422432793511
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,512,65536,0.21560977564917672
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,512,51200,0.08073333236906263
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,512,16384,0.03160088923242357
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,512,12288,0.009565333525339762
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,512,16384,0.0688471131854587
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,512,10240,0.009705777797434065
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,512,12288,0.025080889463424683
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,512,12288,0.05740000141991509
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,512,10240,0.023032888770103455
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,512,8192,0.008295111358165741
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,512,7168,0.007999111380841997
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,512,8192,0.044157332844204374
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,512,8192,0.01992177797688378
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,512,6144,0.007346666521496243
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,512,7168,0.01847822301917606
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,512,7168,0.041617777612474226
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,512,5120,0.008000888758235509
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,768,51200,0.17458577950795492
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,512,6144,0.01754844519827101
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,512,6144,0.037364443143208824
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,512,4096,0.007599111232492659
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,512,5120,0.016507556041081745
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,512,5120,0.03563288847605387
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,512,3584,0.006924444602595435
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,512,4096,0.01483022173245748
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,512,4096,0.03219466739230686
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,512,3072,0.006291555447710886
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,512,3584,0.014829332629839579
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,512,3584,0.03151466780238681
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,512,2560,0.00590844452381134
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,512,3072,0.02951822347111172
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,512,2048,0.005214222189452913
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,512,2560,0.013798221945762634
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,512,2560,0.02879377868440416
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,512,51200,0.17310933272043863
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,512,1536,0.00452888881166776
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,512,2048,0.027428444888856676
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,512,2048,0.01314933349688848
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,512,1024,0.0039048890272776284
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,512,10240,0.05116888880729675
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,512,1536,0.012448888685968188
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,512,1536,0.026076444321208533
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,512,768,0.003527111063400904
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,512,1024,0.012404444317022959
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,512,1024,0.0240631103515625
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,512,512,0.0034942221310403612
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,512,768,0.012240889171759287
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,512,256,0.0028435554769304064
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,768,256,0.0031991110493739447
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,512,512,0.023362666368484497
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,512,128,0.0028168888141711554
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,512,256,0.011751111182901593
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,512,256,0.022171555293930903
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,512,64,0.002524444419476721
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,512,128,0.011759111450778114
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,512,32,0.0025475554996066624
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,512,64,0.011402666568756104
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,512,3072,0.014092443717850579
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,256,65536,0.016139555308553908
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,512,32,0.011726222104496427
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,256,51200,0.014021333720948962
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,256,65536,0.09840710957845052
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,256,65536,0.21555288632710776
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,256,16384,0.009697777529557547
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,256,51200,0.17319733566708037
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,256,16384,0.029831111431121826
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,256,12288,0.008435555630260045
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,512,768,0.023023999399609033
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,256,16384,0.06702488660812378
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,256,10240,0.008977777428097194
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,512,512,0.011744889120260874
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,256,12288,0.056186669402652316
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,256,8192,0.00811288919713762
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,256,10240,0.05011466807789273
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,256,10240,0.02269511090384589
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,256,7168,0.007988444632954067
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,512,128,0.019955555597941082
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,256,8192,0.04313955704371134
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,256,8192,0.0192248887485928
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,256,6144,0.007273777491516537
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,256,7168,0.018539556198649935
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,256,5120,0.007978666987684038
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,256,7168,0.04144088758362664
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,256,4096,0.007289778027269576
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,256,6144,0.037704888317320086
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,256,6144,0.017196445001496207
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,256,5120,0.034576889541414045
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,256,3584,0.006953777538405524
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,256,5120,0.016224000189039443
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,256,3072,0.006565333240562015
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,256,4096,0.015198222464985318
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,256,4096,0.03183999988767836
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,256,2560,0.006346666564544042
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,256,3584,0.030862222115198772
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,256,3584,0.014117333624098035
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,256,51200,0.07801689041985406
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,256,2048,0.006223111102978389
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,256,3072,0.013944000005722046
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,256,3072,0.03016888764169481
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,256,1536,0.004229333251714706
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,256,2560,0.02808977829085456
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,256,2560,0.013362666798962487
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,256,2048,0.01329066687160068
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,256,2048,0.02641244398223029
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,256,1024,0.0038604442444112566
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,256,768,0.0035911111368073356
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,256,1536,0.025702221526039973
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,256,1536,0.012998222476906247
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,256,512,0.0032071111102898917
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,256,1024,0.012039999994966718
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,256,1024,0.02404800057411194
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,256,256,0.0028782222006056043
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,256,768,0.023415111833148535
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,256,128,0.002620444529586368
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,256,512,0.012080888781282636
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,256,512,0.023033777872721355
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,256,12288,0.02500711050298479
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,256,256,0.011720000041855706
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,256,32,0.0028115556471877625
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,256,128,0.019931554794311523
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,256,128,0.011022222538789114
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,128,65536,0.015448888142903646
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,256,64,0.011376000112957425
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,128,51200,0.013051555388503604
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,256,32,0.011376889215575324
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,128,65536,0.09841866625679864
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,128,16384,0.009647111097971598
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,128,65536,0.21525688966115317
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,128,51200,0.07682044638527764
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,128,51200,0.17275910907321504
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,128,12288,0.008288000192907121
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,128,16384,0.02948444419436985
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,128,16384,0.0673182209332784
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,128,12288,0.0561386677953932
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,128,10240,0.007723555796676212
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,128,10240,0.05031466815206739
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,128,10240,0.02269422180122799
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,128,8192,0.007282666862010956
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,128,8192,0.01956977778010898
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,128,8192,0.04415377643373278
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,128,7168,0.0069822221994400024
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,256,64,0.002475555572244856
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,256,256,0.02130844526820713
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,128,6144,0.006587555425034628
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,128,7168,0.018888889087571036
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,128,5120,0.006271111054552927
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,128,6144,0.03753688931465149
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,128,6144,0.01722666621208191
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,128,4096,0.006653333289755716
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,128,5120,0.016563556260532804
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,128,5120,0.03458399905098809
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,128,3584,0.006303999986913469
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,128,4096,0.014767110347747803
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,128,4096,0.03256444467438592
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,128,3072,0.00628355559375551
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,128,3584,0.030605332718955144
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,128,3584,0.01444355481200748
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,128,2560,0.006247111078765657
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,128,12288,0.024915556112925213
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,128,3072,0.014146667387750415
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,128,2048,0.006110222389300664
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,128,3072,0.029506666792763606
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,128,2560,0.028785778416527644
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,128,2560,0.013456888496875763
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,128,1536,0.004519999855094486
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,128,2048,0.025685333543353613
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,128,2048,0.013456888496875763
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,128,1024,0.003834666477309333
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,128,1536,0.02609511050913069
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,128,1536,0.012436444560686747
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,256,768,0.011758222348160215
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,128,1024,0.02313422163327535
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,128,1024,0.012469333079126147
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,128,512,0.003165333428316646
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,128,768,0.01204711116022534
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,128,256,0.003112888791494899
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,128,7168,0.04108711083730062
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,128,512,0.022639999787012737
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,128,512,0.012200000385443369
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,128,128,0.00282577777074443
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,128,256,0.022299556268586054
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,128,256,0.011383111278216044
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,128,128,0.011722666521867117
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,128,32,0.002826666666401757
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,64,65536,0.013944000005722046
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,128,64,0.011411555939250521
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,64,51200,0.012375999655988483
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,64,65536,0.09633511304855347
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,64,16384,0.008296888735559251
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,64,51200,0.07577777571148343
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,64,12288,0.007672000262472365
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,64,16384,0.029917332861158583
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,64,10240,0.007290666302045186
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,64,12288,0.02490666674243079
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,64,8192,0.0069208890199661255
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,64,10240,0.022633777724372015
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,128,768,0.0034924443397257063
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,64,7168,0.006589333216349284
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,64,8192,0.019559999306996662
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,64,6144,0.006592000110281839
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,128,768,0.0233262214395735
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,64,7168,0.018588445252842374
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,64,4096,0.005897777775923411
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,64,6144,0.017400888933075797
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,64,3584,0.006239999913507038
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,128,64,0.0028284444577164124
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,128,128,128,0.018195556269751657
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,64,4096,0.014950222439236112
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,64,2560,0.006250666661394968
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,64,3584,0.014426666829321118
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,64,2048,0.0059004442559348206
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,128,32,0.01163644426398807
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,64,3072,0.013471110827393003
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,64,1536,0.004583111239804162
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,64,2560,0.013755555782053204
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,64,1024,0.003531555748648114
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,64,768,0.003536888708670934
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,64,2048,0.013069333301650153
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,64,1536,0.0123857781291008
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,64,1024,0.012113778127564324
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,64,256,0.0028684443483750024
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,64,768,0.012436444560686747
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,64,128,0.00254133323000537
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,64,512,0.011376000112957425
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,64,64,0.002491555487116178
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,64,256,0.011429333024554782
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,64,32,0.0028151110228565005
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,64,128,0.011500444677140979
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,32,65536,0.01365244471364551
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,64,64,0.010675555302037133
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,32,51200,0.01203644441233741
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,64,32,0.011382222175598145
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,64,5120,0.006281777802440856
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,32,65536,0.09576444493399726
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,32,16384,0.008066666622956594
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,32,51200,0.07493155532413058
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,32,12288,0.007592889169851939
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,32,10240,0.007321777443091075
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,64,5120,0.016048888365427654
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,32,8192,0.006928000185224745
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,64,3072,0.006064888917737537
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,32,12288,0.024728000164031982
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,32,7168,0.00657155571712388
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,32,10240,0.022631999519136217
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,32,6144,0.00629333323902554
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,32,5120,0.006245333287451003
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,32,8192,0.019235556324323017
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,32,4096,0.005903999838564131
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,32,7168,0.0181377778450648
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,32,3584,0.006240889016124938
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,32,6144,0.01724177764521705
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,32,3072,0.005611555443869696
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,64,512,0.003168888803985384
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,32,4096,0.014767999450365702
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,32,2560,0.0064737776087390045
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,32,3584,0.014092443717850579
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,32,3072,0.013765333427323235
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,32,2560,0.01311822235584259
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,32,2048,0.012748444245921241
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,32,1024,0.003677333394686381
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,32,1536,0.012409778104888068
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,32,768,0.00350577798154619
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,32,1024,0.012055111428101858
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,32,512,0.003162666741344664
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,32,768,0.011759111450778114
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,32,256,0.00282222218811512
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,32,512,0.011417778001891242
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,32,128,0.00254133323000537
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,32,16384,0.029826667573716905
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,32,256,0.011188444164064197
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,32,64,0.002518222149875429
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,32,32,0.0028408887899584244
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,32,128,0.011028444601429833
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,32,64,0.010683555569913654
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,32,32,0.011506666739781698
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,128,32,5120,0.015858666764365304
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,32,2048,0.0058808889653947614
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,128,32,1536,0.00424177779091729
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,65536,12288,0.2829359902275933
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,65536,16384,0.22055466969807944
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,65536,12288,0.16564088397555882
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,65536,10240,0.23651822408040366
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,65536,51200,0.6611955430772569
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,65536,10240,0.13968711429172093
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,65536,7168,0.1704097721311781
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,65536,8192,0.11846578121185303
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,65536,6144,0.14572266737620035
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,65536,7168,0.10128355688518947
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,65536,51200,1.1461448669433594
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,65536,5120,0.12265688843197292
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,65536,5120,0.07596800062391493
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,65536,3584,0.08833244774076675
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,65536,6144,0.08900177478790283
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,65536,3072,0.07679288917117648
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,65536,3584,0.05825510952207777
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,65536,3072,0.0517137779129876
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,65536,2560,0.0642791125509474
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,65536,2048,0.05225955446561178
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,65536,4096,0.06404178010092841
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,65536,2560,0.04588355620702108
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,65536,16384,0.37258044878641766
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,65536,1536,0.04069777660899692
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,65536,2048,0.040992889139387347
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,65536,768,0.022421333524915908
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,65536,1536,0.034188446071412824
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,65536,512,0.015612444943851896
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,65536,256,0.010612444745169746
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,65536,8192,0.19063822428385416
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,65536,768,0.024845333562956914
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,65536,1024,0.02833333280351427
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,65536,512,0.020921778347757127
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,65536,64,0.00590844452381134
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,65536,256,0.019256000717480976
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,65536,32,0.006286222073766921
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,65536,128,0.017887110511461895
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,65536,64,0.017508443858888414
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,65536,32,0.02040799955526988
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,65536,4096,0.09932621982362534
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,51200,16384,0.2832871013217502
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,51200,51200,0.5253289010789659
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,65536,1024,0.029412445094850328
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,51200,65536,0.6825120184156629
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,51200,51200,0.8776257832845052
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,51200,65536,1.1148977279663086
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,51200,12288,0.13485156165228948
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,51200,12288,0.2148604393005371
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,51200,10240,0.16823555363549125
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,65536,128,0.00793333351612091
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,51200,16384,0.1786515580283271
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,51200,8192,0.13852889007992214
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,51200,7168,0.11977688471476237
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,51200,6144,0.10328533252080281
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,51200,8192,0.09652177492777507
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,51200,10240,0.11345867315928142
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,51200,6144,0.07351377937528822
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,51200,4096,0.07389777898788452
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,51200,3584,0.06373333268695407
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,51200,5120,0.0887262225151062
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,51200,4096,0.05338755581114027
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,51200,7168,0.08301511075761583
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,51200,3072,0.05564800235960218
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,51200,2560,0.04713955521583557
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,51200,2048,0.03887110948562622
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,51200,1536,0.030080000559488933
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,51200,3072,0.043755554490619235
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,51200,2560,0.03953244288762411
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,51200,1024,0.023349333140585158
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,51200,768,0.017836444907718234
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,51200,2048,0.03554577628771464
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,51200,1536,0.029849777619043987
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,51200,512,0.012401777837011548
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,51200,256,0.008953777452309927
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,51200,1024,0.024233778317769367
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,51200,128,0.006447111152940326
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,51200,768,0.021549334128697712
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,51200,64,0.005906666732496685
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,51200,32,0.006239111224810283
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,51200,256,0.01754844519827101
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,51200,128,0.016551999582184684
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,51200,64,0.017860444055663217
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,51200,32,0.01841600073708428
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,16384,65536,0.3245306544833713
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,16384,51200,0.25036178694831
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,16384,65536,0.2769040001763238
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,16384,16384,0.08578133583068848
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,16384,51200,0.21517954932318795
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,16384,12288,0.06567466921276517
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,16384,10240,0.055833776791890465
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,16384,16384,0.0783440007103814
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,16384,8192,0.04646133383115133
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,51200,5120,0.0629626644982232
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,51200,3584,0.048972444401847
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,16384,7168,0.04122399952676561
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,16384,10240,0.05126666691568163
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,16384,12288,0.061166220241122775
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,16384,6144,0.03586666782697042
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,16384,5120,0.030629333522584703
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,16384,8192,0.04458666510052151
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,16384,3584,0.023108444280094568
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,16384,6144,0.03597777750757005
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,16384,7168,0.03982133335537381
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,16384,3072,0.020498666498396132
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,16384,2560,0.017675555414623685
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,51200,512,0.01905422243807051
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,16384,2048,0.014408000641398959
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,16384,3072,0.023307555251651343
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,16384,2560,0.021347555849287245
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,16384,1536,0.011739555332395764
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,16384,1024,0.009648888475365108
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,16384,2048,0.019613333874278598
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,16384,1536,0.017857778403494094
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,16384,768,0.00793599999613232
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,16384,1024,0.016136889656384785
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,16384,768,0.015042665931913586
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,16384,256,0.004520888957712385
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,16384,256,0.013072888884279462
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,16384,128,0.003858666867017746
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,16384,128,0.012741333080662621
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,16384,64,0.0035546666218174826
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,16384,4096,0.026366222235891554
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,16384,32,0.0038328886859946777
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,16384,5120,0.03182933396763272
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,16384,64,0.012431999875439538
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,16384,3584,0.026050666968027752
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,16384,32,0.013420444395807056
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,12288,65536,0.24356089697943795
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,12288,51200,0.18854133288065592
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,12288,16384,0.06465688678953382
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,12288,65536,0.22580978605482313
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,16384,512,0.006260444306664997
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,12288,51200,0.17537332905663383
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,12288,12288,0.05017955435646904
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,12288,10240,0.04217866725391812
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,12288,8192,0.036064889695909284
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,12288,12288,0.05163733495606316
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,12288,16384,0.06545422474543254
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,12288,10240,0.04349777764744229
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,12288,6144,0.027264888087908428
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,12288,5120,0.023796444137891132
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,12288,4096,0.020601777566803824
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,12288,6144,0.030697776211632624
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,12288,7168,0.0340595543384552
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,12288,5120,0.02741688821050856
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,12288,3584,0.017665778597195942
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,12288,3072,0.015442666080262927
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,12288,2560,0.013442666994200813
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,12288,4096,0.02332177758216858
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,12288,3584,0.022277333670192297
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,12288,2048,0.011427555647161273
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,12288,3072,0.020958221620983545
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,12288,1536,0.009687999884287516
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,12288,1024,0.008286221987671321
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,12288,2560,0.019613333874278598
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,16384,4096,0.02786133355564541
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,12288,2048,0.01827111177974277
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,12288,768,0.006948444578382704
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,12288,1536,0.017108443710539076
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,12288,1024,0.014828445182906257
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,12288,768,0.014440889159838358
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,12288,256,0.0041751112374994485
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,12288,128,0.0038559999730851916
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,12288,512,0.013407111167907715
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,12288,64,0.003555555724435382
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,12288,128,0.012230222423871359
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,12288,256,0.012831110921170978
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,12288,32,0.003855111284388436
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,12288,64,0.013417777915795645
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,12288,7168,0.030728889836205378
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,10240,65536,0.2056657738155789
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,12288,8192,0.0377200014061398
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,10240,51200,0.1566915512084961
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,10240,65536,0.21553066041734484
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,10240,12288,0.04297955499755012
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,10240,51200,0.16911821895175508
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,10240,10240,0.03591022226545546
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,10240,16384,0.0632257792684767
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,10240,12288,0.05016711023118761
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,10240,8192,0.030177778667873804
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,10240,7168,0.026307556364271376
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,12288,512,0.0052151112920708126
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,10240,10240,0.042075554529825844
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,10240,6144,0.02309688925743103
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,10240,8192,0.03701333204905192
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,10240,5120,0.020267556111017864
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,10240,7168,0.03287555442916022
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,10240,4096,0.017456889152526855
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,10240,6144,0.0299288895395067
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,10240,3584,0.014862222803963555
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,10240,5120,0.02591111097070906
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,10240,3072,0.01314933349688848
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,10240,4096,0.022967111733224656
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,10240,2560,0.011752888560295105
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,10240,3584,0.021839110387696162
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,10240,2048,0.010236444572607676
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,10240,3072,0.02058577703105079
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,10240,1536,0.00832711077398724
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,10240,2560,0.01926399932967292
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,12288,32,0.01351999988158544
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,10240,1024,0.0069368887278768755
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,10240,768,0.005283555636803309
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,10240,2048,0.017860444055663217
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,10240,512,0.004505777938498391
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,10240,1536,0.01649688846535153
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,10240,256,0.0038542221817705366
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,10240,128,0.003567111161020067
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,10240,16384,0.05484977695677015
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,10240,768,0.013901333014170328
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,10240,64,0.0035013332962989807
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,10240,512,0.0131217779384719
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,10240,256,0.012735111018021902
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,10240,32,0.0035502223504914176
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,10240,128,0.01236977759334776
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,10240,64,0.012749333348539142
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,10240,32,0.012726222475369772
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,8192,16384,0.04895288745562235
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,8192,51200,0.1420995526843601
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,8192,65536,0.1738871071073744
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,8192,12288,0.038020445240868464
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,8192,51200,0.13573511441548666
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,8192,10240,0.03187111020088196
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,8192,16384,0.05249599946869744
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,8192,8192,0.0277502222193612
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,8192,7168,0.023976888921525743
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,8192,10240,0.03511910968356662
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,8192,8192,0.03116977877087063
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,8192,6144,0.021262221866183813
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,8192,5120,0.018036444981892902
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,8192,7168,0.028076443407270644
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,8192,4096,0.015383111106024848
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,8192,6144,0.02472711106141408
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,8192,3584,0.012705778082211813
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,16384,512,0.013806222213639153
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,8192,3072,0.011672000090281168
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,8192,4096,0.02051911089155409
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,8192,3584,0.01956355571746826
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,10240,1024,0.014110222458839417
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,8192,2560,0.0101742222905159
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,8192,2048,0.009009777671760982
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,8192,3072,0.01854311095343696
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,8192,1536,0.007659555309348636
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,8192,1024,0.00645955569214291
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,8192,2560,0.01754844519827101
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,8192,2048,0.016536888149049547
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,8192,768,0.004879999905824661
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,8192,512,0.00453599997692638
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,8192,1024,0.013463999662134381
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,8192,65536,0.18497333261701795
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,8192,256,0.0038773334688610504
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,8192,768,0.013648000028398303
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,8192,128,0.0038364442686239877
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,8192,512,0.012791111237472959
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,8192,64,0.0035093331502543557
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,8192,128,0.012044444680213928
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,8192,256,0.01239999963177575
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,8192,32,0.0035031110876136353
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,8192,64,0.011749332977665795
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,8192,32,0.013074666261672974
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,7168,65536,0.16228977839152017
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,7168,65536,0.17134043905470106
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,7168,51200,0.12862311469184026
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,8192,5120,0.022655111220147874
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,7168,16384,0.050386667251586914
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,7168,12288,0.035678221119774714
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,7168,51200,0.1327635579639011
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,7168,10240,0.029701332251230877
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,7168,16384,0.05117333266470167
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,7168,8192,0.02600266701645321
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,7168,12288,0.041117333703570895
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,7168,7168,0.022582223018010456
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,7168,6144,0.019662222928471036
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,7168,10240,0.033936000532574125
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,7168,8192,0.029735998974906072
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,7168,5120,0.01684711045689053
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,7168,7168,0.026368889543745253
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,7168,4096,0.014654222461912366
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,7168,6144,0.024481778343518574
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,7168,5120,0.022104000051816303
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,7168,4096,0.019987555013762582
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,7168,3072,0.010863111250930362
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,7168,3584,0.019465777609083388
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,7168,3072,0.018234666850831773
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,8192,12288,0.041952000723944775
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,7168,2048,0.008661333057615492
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,7168,2560,0.017532444662517972
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,7168,1536,0.0076453329788313965
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,7168,1024,0.005935110979610019
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,7168,2048,0.01568266749382019
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,7168,768,0.005205333232879639
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,7168,1024,0.013367111484209696
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,7168,512,0.00424799985355801
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,7168,256,0.003948444293604957
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,7168,768,0.013412444127930535
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,7168,128,0.0038417776425679526
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,7168,512,0.012771555946932899
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,7168,256,0.012099555797047086
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,7168,64,0.003551111039188173
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,7168,32,0.003896000070704354
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,7168,128,0.011766222616036734
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,7168,64,0.011752888560295105
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,7168,32,0.0120666664507654
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,8192,1536,0.014882667197121514
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,6144,65536,0.14419733153449163
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,7168,3584,0.012108444339699216
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,6144,16384,0.04372355673048231
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,6144,51200,0.11431288719177246
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,6144,12288,0.02902666727701823
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,6144,65536,0.16355821821424696
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,7168,2560,0.009640889035330879
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,6144,16384,0.04970488945643107
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,6144,10240,0.02444177700413598
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,6144,51200,0.12838933202955458
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,6144,7168,0.0181048893266254
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,6144,8192,0.021008888880411785
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,6144,12288,0.038783109850353666
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,6144,6144,0.016188444362746347
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,6144,5120,0.014138667119873894
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,6144,10240,0.032962666617499456
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,6144,4096,0.012395555774370829
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,6144,8192,0.028763555818133887
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,6144,7168,0.026404443714353774
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,6144,3584,0.01127199994193183
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,6144,3072,0.009999111294746399
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,6144,6144,0.02366399930583106
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,6144,5120,0.02145066691769494
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,6144,2560,0.008756444685988957
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,6144,4096,0.019897777173254225
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,7168,1536,0.014527999692493014
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,6144,3584,0.019108444452285767
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,6144,3072,0.018182223041852314
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,6144,1024,0.004967111266321606
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,6144,2560,0.01685688893000285
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,6144,768,0.004312889029582341
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,6144,2048,0.015124445160230001
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,6144,512,0.0041244443919923575
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,6144,1536,0.014459555347760519
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,6144,256,0.0038480001191298165
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,6144,1024,0.01311822235584259
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,6144,128,0.0033244445092148254
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,6144,768,0.013464888764752282
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,6144,64,0.0029493332323100832
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,6144,512,0.01276088919904497
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,6144,32,0.0032026666320032547
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,6144,256,0.012097777591811286
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,6144,128,0.011756444142924415
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,6144,64,0.012033777932325998
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,5120,65536,0.11630222532484268
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,6144,32,0.012134222520722283
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,5120,51200,0.09434933132595485
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,5120,16384,0.039361778232786394
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,5120,12288,0.030692444907294378
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,5120,65536,0.15923999415503606
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,5120,10240,0.027455111344655354
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,5120,16384,0.04816533459557427
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,5120,51200,0.12583555115593806
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,5120,8192,0.019141332970725167
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,5120,12288,0.03765689002143012
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,5120,7168,0.016484444340070088
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,5120,6144,0.014767999450365702
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,5120,8192,0.027790221903059218
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,5120,5120,0.012820444173283048
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,5120,7168,0.02548177705870734
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,5120,4096,0.01163200040658315
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,5120,6144,0.023795555035273235
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,5120,3584,0.009977777798970541
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,5120,5120,0.02143200072977278
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,6144,2048,0.007682667010360294
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,6144,1536,0.006912888752089606
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,5120,3072,0.009313777916961247
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,5120,4096,0.019626667102177937
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,5120,2560,0.008270222279760573
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,5120,2048,0.007296889192528195
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,5120,3584,0.018713777263959248
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,5120,1536,0.006230222268237009
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,5120,3072,0.01742755538887448
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,5120,1024,0.004874666531880696
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,5120,2560,0.01569333341386583
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,5120,768,0.004243555582231945
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,5120,2048,0.01479288935661316
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,5120,512,0.003912888881233004
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,5120,1536,0.014135999812020196
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,5120,1024,0.013182222015327878
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,5120,768,0.013078221844302284
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,5120,128,0.003499555504984326
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,5120,512,0.012735111018021902
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,5120,64,0.002938666691382726
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,5120,256,0.012091555529170565
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,5120,32,0.0033724444607893624
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,5120,128,0.01166133334239324
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,5120,64,0.011767999993430244
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,4096,65536,0.09370044204923843
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,5120,32,0.012109333442317115
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,4096,51200,0.07635200023651123
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,4096,16384,0.03125422199567159
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,4096,12288,0.025389333566029865
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,4096,65536,0.11794755193922256
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,4096,51200,0.09419288900163438
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,4096,10240,0.02235466738541921
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,4096,8192,0.016192888220151264
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,4096,16384,0.036826666858461164
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,4096,12288,0.029743999242782593
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,4096,7168,0.014454222387737699
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,4096,10240,0.02493422230084737
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,4096,6144,0.012599111431174807
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,4096,5120,0.011376889215575324
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,4096,8192,0.022680888573328655
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,4096,7168,0.020873778396182593
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,4096,6144,0.01958488921324412
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,4096,3584,0.00906044410334693
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,4096,5120,0.018191110756662156
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,4096,4096,0.01622488929165734
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,4096,2560,0.00757244477669398
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,4096,3584,0.015512888630231222
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,5120,256,0.003504000190231535
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,4096,2048,0.006554666492674086
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,4096,3072,0.014952888091405233
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,4096,1536,0.0055440002017551
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,4096,1024,0.004520888957712385
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,4096,2560,0.014102222190962898
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,4096,768,0.0038897775941424896
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,4096,2048,0.013755555782053204
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,4096,512,0.003552000141806073
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,4096,1536,0.013170666992664337
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,4096,1024,0.012438221938080259
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,4096,768,0.012740444805887012
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,4096,128,0.0035111109415690103
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,4096,512,0.012440889245933957
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,4096,64,0.003206222214632564
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,4096,256,0.011752000285519494
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,5120,10240,0.03181333343187968
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,4096,32,0.003504000190231535
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,4096,128,0.011415111521879831
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,4096,64,0.0118222220076455
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,3584,65536,0.0842755569352044
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,4096,32,0.012076444096035428
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,3584,51200,0.0695306658744812
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,3584,16384,0.030209776428010728
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,3584,65536,0.11526666747199164
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,3584,12288,0.024346666203604803
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,4096,4096,0.010255999863147736
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,3584,10240,0.02163022259871165
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,3584,16384,0.035191999541388616
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,3584,8192,0.015425778097576566
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,3584,12288,0.028373334142896865
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,3584,7168,0.013553777502642738
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,3584,10240,0.024365334047211543
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,3584,8192,0.022443556123309668
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,3584,5120,0.011000889043013254
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,3584,7168,0.020626667473051283
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,3584,4096,0.009782222410043081
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,3584,6144,0.01926666663752662
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,3584,3584,0.008769777913888296
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,3584,5120,0.017845332622528076
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,3584,4096,0.01611111064751943
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,4096,256,0.0032222221295038858
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,3584,3584,0.015239111251301236
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,3584,2560,0.006974221931563483
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,3584,2048,0.006105777704053455
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,3584,3072,0.014454222387737699
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,3584,1536,0.005212444398138259
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,3584,2560,0.014098667436175875
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,3584,1024,0.004193777839342753
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,3584,2048,0.013479111095269522
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,3584,768,0.0039013334446483185
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,3584,1536,0.01310755560795466
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,3584,512,0.003524444583389494
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,3584,1024,0.012455110748608908
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,3584,256,0.003552000141806073
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,3584,768,0.0124177775449223
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,3584,51200,0.09177866909239028
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,3584,128,0.003177777760558658
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,3584,64,0.003173333282272021
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,3584,256,0.011704888608720569
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,3584,32,0.0031617778456873367
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,4096,3072,0.008263111114501953
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,3584,64,0.011439999772442712
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,3072,65536,0.07590755489137438
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,3584,32,0.011711999773979187
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,3072,51200,0.06179022126727634
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,3072,65536,0.11264533466762966
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,3072,16384,0.02535199953450097
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,3072,51200,0.09012977944480048
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,3584,3072,0.007984889050324758
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,3072,12288,0.021811554829279583
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,3072,10240,0.018593778212865193
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,3072,16384,0.03384622269206577
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,3072,12288,0.027879112296634253
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,3072,10240,0.02380888826317257
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,3072,7168,0.01497688889503479
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,3072,8192,0.021537777450349595
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,3072,6144,0.012719111310111152
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,3072,5120,0.010666666759385003
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,3072,7168,0.020233778489960563
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,3072,4096,0.009591999981138442
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,3072,6144,0.019034667147530448
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,3072,3584,0.008343111309740279
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,3072,4096,0.015803555647532146
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,3584,512,0.012120000190205045
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,3072,3072,0.007890666524569193
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,3072,2560,0.0069253332912921906
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,3072,3584,0.01481244464715322
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,3072,2048,0.006872889068391588
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,3584,6144,0.012307555311255984
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,3072,3072,0.014333332578341166
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,3072,1536,0.005223111146026188
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,3072,2560,0.014085332552591959
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,3072,1024,0.004540444248252445
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,3072,768,0.004247111164861255
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,3072,2048,0.013420444395807056
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,3072,1536,0.013080889152155982
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,3072,1024,0.012459555433856117
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,3072,768,0.01240711079703437
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,3072,512,0.012092444631788464
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,3072,128,0.0032115555885765287
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,3072,256,0.011721777419249216
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,3072,8192,0.01631733278433482
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,3072,64,0.0028284444577164124
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,3072,128,0.011374221907721626
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,3072,32,0.003175111073586676
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,3072,64,0.011776000261306763
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,3072,32,0.011982222398122152
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,2560,51200,0.05297333333227369
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,3072,5120,0.017542221479945712
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,2560,65536,0.110097779168023
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,2560,16384,0.02258133391539256
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,2560,12288,0.019271110494931538
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,2560,51200,0.08804533216688369
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,2560,16384,0.03261244297027588
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,3584,128,0.011402666568756104
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,2560,8192,0.015199111567603217
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,2560,12288,0.027295110954178706
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,2560,7168,0.013120888835854001
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,2560,10240,0.023735110958417256
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,3072,512,0.0039057777159743835
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,2560,6144,0.011757333245542316
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,2560,8192,0.021187555458810594
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,2560,5120,0.010382222632567087
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,2560,4096,0.008969777988062965
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,3072,256,0.003552000141806073
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,2560,3584,0.008392000363932716
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,2560,6144,0.018539556198649935
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,2560,5120,0.016714667280515034
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,2560,3072,0.007915555602974361
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,2560,2560,0.006568000134494569
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,2560,4096,0.015499555402331881
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,2560,3584,0.01483022173245748
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,2560,2048,0.005575110928879843
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,2560,3072,0.014115555418862237
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,2560,2560,0.013752000199423896
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,2560,1024,0.004472889006137848
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,2560,65536,0.06393955813513862
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,2560,768,0.0041991112132867174
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,2560,1536,0.01308444473478529
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,2560,1024,0.012441777520709567
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,2560,512,0.0038613333470291565
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,2560,768,0.01239999963177575
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,2560,256,0.00349866681628757
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,2560,512,0.01204622205760744
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,2560,128,0.0031644445326593188
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,2560,256,0.011698666546079846
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,2560,10240,0.016843555702103507
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,2560,64,0.0028284444577164124
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,2560,32,0.00314666661951277
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,2560,128,0.011378666592968835
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,2560,64,0.011431111229790581
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,2048,65536,0.05349777804480659
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,2560,32,0.011700444751315646
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,2048,51200,0.043848888741599194
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,2560,7168,0.019959110352728102
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,2048,16384,0.018932445181740653
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,2048,12288,0.015506666567590503
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,2048,65536,0.10668800274531047
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,2048,51200,0.08558755450778538
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,2048,16384,0.0318195554945204
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,2048,10240,0.01351288871632682
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,2048,8192,0.013746666411558786
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,2048,12288,0.027016000615225896
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,2048,7168,0.012379555238617791
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,2048,10240,0.023330666952663
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,2048,6144,0.011357333097192975
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,2048,8192,0.020618667205174763
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,2560,2048,0.013473778135246701
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,2048,5120,0.010089777410030365
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,2048,4096,0.008903111020723978
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,2048,7168,0.0192577772670322
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,2048,3584,0.007948444121413762
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,2048,3072,0.007276444799370236
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,2048,5120,0.01614488826857673
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,2048,4096,0.014827556080288358
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,2048,2560,0.006250666661394968
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,2048,3584,0.014764444695578681
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,2048,2048,0.005362666729423735
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,2048,1536,0.004855999930037392
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,2048,3072,0.014137778017255994
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,2048,1024,0.0041964443193541635
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,2048,2048,0.01313333296113544
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,2048,1536,0.013094222380055321
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,2048,768,0.0038897775941424896
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,2048,512,0.0035013332962989807
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,2048,1024,0.012462221913867526
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,2048,256,0.0031759999692440033
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,2048,768,0.012448888685968188
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,2048,128,0.002826666666401757
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,2048,64,0.0028453332682450614
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,2048,256,0.012067555553383298
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,2048,32,0.002867555452717675
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,2048,128,0.011396444506115384
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,2048,64,0.011752888560295105
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,1536,65536,0.043281777037514575
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,2048,32,0.011753777662913004
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,1536,51200,0.03461688756942749
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,2560,1536,0.004898666507667965
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,1536,16384,0.015206222732861837
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,1536,12288,0.013556444810496436
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,1536,65536,0.10390310817294651
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,1536,51200,0.08283644252353244
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,1536,10240,0.012504888905419244
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,1536,16384,0.031473779016070895
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,1536,8192,0.011402666568756104
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,1536,7168,0.011017777853541903
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,1536,12288,0.0270453327231937
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,1536,6144,0.010271111296282874
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,1536,8192,0.020294222566816542
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,1536,7168,0.018580444984965853
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,1536,5120,0.009671111073758867
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,1536,4096,0.008373333348168267
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,1536,5120,0.016167110866970487
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,1536,4096,0.015192000402344598
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,1536,3584,0.007253333098358578
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,1536,3072,0.006632888896597757
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,2048,512,0.01204711116022534
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,1536,3584,0.014816888504558139
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,1536,2560,0.0059004442559348206
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,1536,3072,0.014160000615649752
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,1536,2048,0.0052586665583981415
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,1536,1536,0.004859555512666702
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,1536,2560,0.013976888524161445
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,1536,2048,0.013425778183672162
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,1536,1536,0.013064000341627332
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,1536,768,0.0038942222793896994
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,1536,1024,0.012402666939629449
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,1536,512,0.0035093331502543557
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,1536,768,0.012401777837011548
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,1536,256,0.0034942221310403612
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,2048,6144,0.017901332841979135
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,1536,512,0.01239111108912362
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,1536,128,0.0031644445326593188
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,1536,10240,0.02295822236273024
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,1536,64,0.0028906667398081887
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,1536,32,0.002926222152180142
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,1536,256,0.011711111499203576
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,1024,65536,0.03239288926124573
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,1536,128,0.011712888876597086
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,1536,6144,0.01750666730933719
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,1536,32,0.011393778026103973
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,1024,65536,0.10043288601769342
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,1024,16384,0.013064888616402945
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,1024,51200,0.08000000317891438
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,1024,12288,0.014010666145218743
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,1024,16384,0.03109688891304864
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,1024,10240,0.012533333566453723
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,1024,12288,0.025990222891171772
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,1024,8192,0.011368888947698804
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,1024,10240,0.02162222233083513
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,1024,7168,0.01072355525361167
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,1024,8192,0.019268444842762418
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,1024,6144,0.009630222287442949
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,1024,7168,0.018223999275101554
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,1024,5120,0.00869422240389718
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,1024,6144,0.01718577742576599
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,1024,4096,0.00795111142926746
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,1024,5120,0.01581333412064446
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,2048,2560,0.013765333427323235
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,1024,3584,0.0075937774446275495
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,1024,4096,0.01478666729397244
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,1024,3072,0.006633777585294511
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,1024,51200,0.025872000389628943
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,1024,2560,0.006234666539563074
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,1024,2048,0.005366222312053044
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,1024,3584,0.014498665928840637
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,1024,3072,0.014084445105658637
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,1024,1536,0.0047120000753137796
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,1024,2560,0.013776889277829064
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,1024,1024,0.004043555508057277
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,1024,2048,0.013087111214796701
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,1024,768,0.0038417776425679526
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,1024,512,0.003499555504984326
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,1024,1536,0.012785777449607849
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,1024,256,0.0031804444475306403
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,1024,1024,0.01221777747074763
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,1024,128,0.0028151110228565005
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,1024,64,0.0028657778683635923
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,1024,512,0.012054222325483957
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,1024,32,0.0028151110228565005
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,1024,256,0.011707555916574268
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,1536,1024,0.004219555606444676
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,1024,128,0.011393778026103973
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,768,65536,0.027432888746261597
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,1024,64,0.011400000088744693
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,768,51200,0.022266666094462078
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,1024,32,0.011529777612951068
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,768,12288,0.011916444533401065
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,768,65536,0.09840622213151719
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,768,51200,0.07818400197558932
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,768,10240,0.010978666444619497
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,768,8192,0.010036444498433007
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,768,12288,0.02444800072246128
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,768,7168,0.009639110830095079
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,768,10240,0.02160444524553087
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,768,6144,0.00867733359336853
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,768,8192,0.01958311100800832
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,768,5120,0.007756444315115611
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,768,7168,0.018193778064515855
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,768,4096,0.007995555798212687
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,768,6144,0.01717511150572035
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,768,3584,0.00777422222826216
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,768,5120,0.016200888488027785
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,768,3072,0.00655644428398874
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,768,4096,0.014793778459231058
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,768,2560,0.005722666780153911
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,768,3584,0.014496889379289416
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,768,2048,0.00519466648499171
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,768,3072,0.014133334159851074
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,768,1536,0.00453244439429707
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,768,2560,0.013746666411558786
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,1024,768,0.01236977759334776
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,768,2048,0.013068444199032254
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,768,768,0.0038515557017591265
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,768,1536,0.01313511116637124
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,768,512,0.0032008888406885993
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,768,1024,0.012383999923865
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,768,16384,0.01368533323208491
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,768,256,0.0031386667655573953
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,768,768,0.012379555238617791
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,768,512,0.012298666768603854
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,768,64,0.002565333412753211
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,768,128,0.011357333097192975
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,768,32,0.0028026666906144884
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,768,64,0.011391999820868174
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,512,65536,0.02084355552991231
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,768,32,0.011415111521879831
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,1536,64,0.011415111521879831
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,512,51200,0.01681066718366411
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,512,16384,0.011055111057228513
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,512,65536,0.09647022353278266
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,512,12288,0.009314667019579146
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,512,51200,0.07614133093092176
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,512,16384,0.029494222667482164
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,512,12288,0.02437688906987508
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,512,8192,0.008631111019187504
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,512,7168,0.008301333420806462
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,512,10240,0.021384888225131567
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,768,1024,0.0038986665507157645
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,512,6144,0.007709333466158972
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,512,8192,0.01941866676012675
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,512,7168,0.018208889497650992
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,512,6144,0.017038222816255357
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,512,4096,0.007600888609886169
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,768,128,0.0028648889727062653
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,512,5120,0.016159999701711867
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,768,16384,0.030838221311569214
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,512,4096,0.014713777436150445
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,512,3072,0.006252444452709622
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,512,2560,0.005937777873542573
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,512,3584,0.014787554740905762
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,512,2048,0.0052151112920708126
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,512,3072,0.013815110756291283
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,512,1536,0.004523555437723796
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,512,2560,0.013767999907334646
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,512,1024,0.0041928887367248535
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,512,2048,0.013413333230548434
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,512,768,0.003567999849716822
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,512,1536,0.012741333080662621
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,512,512,0.0031600000543726813
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,512,1024,0.012053333222866058
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,512,256,0.0031759999692440033
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,512,10240,0.009760888914267222
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,512,128,0.002830222249031067
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,512,512,0.012038222617573209
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,512,64,0.0025395556456512874
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,512,256,0.011705777711338468
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,512,32,0.002842666581273079
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,512,128,0.011420444481902652
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,256,65536,0.016301333904266357
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,512,64,0.011383111278216044
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,512,5120,0.00870311094654931
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,512,32,0.011407111254003314
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,256,16384,0.009637333452701569
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,256,65536,0.09393866856892903
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,512,3584,0.007251555720965068
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,256,12288,0.008338666624493068
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,256,51200,0.07299644417232938
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,256,16384,0.028794666131337483
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,768,256,0.011424000064531961
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,256,10240,0.011355555719799466
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,256,8192,0.009720889230569204
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,256,7168,0.009263111485375298
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,256,6144,0.008685333033402761
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,256,12288,0.024103111690945093
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,256,10240,0.02162577708562215
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,256,8192,0.01886666648917728
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,256,7168,0.018179555733998615
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,256,4096,0.007635555333561367
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,256,6144,0.016976000534163583
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,256,5120,0.015956444872750174
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,256,3072,0.006269333263238271
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,256,4096,0.014562666416168213
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,256,3584,0.014689778288205465
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,256,3072,0.014104000396198697
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,512,768,0.012449777788586087
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,256,2048,0.005240889059172736
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,256,2560,0.013759111364682516
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,256,1536,0.004545777622196409
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,256,1024,0.00388355553150177
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,256,2048,0.013408000270525614
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,256,1536,0.01276266657643848
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,256,768,0.0035128887328836652
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,256,512,0.003173333282272021
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,256,1024,0.012448000411192576
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,256,51200,0.014013333453072442
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,256,768,0.012438221938080259
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,256,512,0.012191111014948951
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,256,128,0.002797333316670524
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,256,64,0.002536000063021978
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,256,256,0.011360888679822287
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,256,32,0.002809777855873108
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,256,128,0.011361777782440186
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,256,64,0.011601777540312873
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,128,65536,0.015462223026487561
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,256,32,0.011094222466150919
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,128,51200,0.01497155593501197
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,256,5120,0.008610666626029545
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,128,16384,0.009322666459613377
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,128,12288,0.00997688869635264
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,256,3584,0.0069155556460221606
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,128,65536,0.09188977877298991
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,128,10240,0.00868088917599784
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,128,16384,0.028472890456517536
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,128,51200,0.07169155279795329
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,128,8192,0.008282666405042013
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,128,12288,0.024153777294688757
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,128,7168,0.009023110899660323
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,256,2560,0.005566222386227713
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,128,6144,0.008625778059164682
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,128,10240,0.021741333934995864
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,128,5120,0.007628444168302748
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,128,8192,0.018736888964970905
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,128,4096,0.0074417781498697065
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,128,7168,0.01790577835506863
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,128,3584,0.006956444846259222
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,128,3072,0.006284444282452266
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,128,5120,0.015810666812790763
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,128,2560,0.005603555589914322
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,128,4096,0.014553777045673795
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,128,3584,0.014101333088344999
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,128,2048,0.004927111168702443
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,128,3072,0.014103111293580798
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,128,1536,0.004552000098758274
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,128,1024,0.003867555409669876
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,128,2560,0.013713777893119387
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,128,768,0.00351200004418691
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,128,2048,0.012832889126406776
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,256,256,0.0028577778074476454
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,128,1536,0.013119999733236102
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,128,256,0.0028293333533737394
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,128,768,0.012457778056462606
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,128,128,0.0028106667515304354
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,128,512,0.012130666938092975
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,128,64,0.002557333351837264
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,128,128,0.011406222151385413
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,128,32,0.0028124445428450904
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,128,64,0.011468444433477191
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,64,65536,0.014816888504558139
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,128,32,0.011707555916574268
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,64,51200,0.014072888427310519
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,64,65536,0.09124266439014012
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,64,16384,0.009357333183288574
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,64,51200,0.07146044572194417
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,64,12288,0.009657777845859528
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,64,16384,0.0285537772708469
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,64,10240,0.009047110875447592
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,64,12288,0.024047111471494038
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,64,8192,0.008059555457697975
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,64,10240,0.021406221720907424
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,128,512,0.003149333306484752
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,64,7168,0.007640889121426477
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,128,1024,0.01204711116022534
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,64,6144,0.008351999852392409
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,64,8192,0.019150222341219585
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,64,5120,0.007702222300900354
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,64,4096,0.0069919998447100324
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,64,7168,0.017608000172509086
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,128,256,0.012051555845472546
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,64,6144,0.01688799924320645
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,64,3584,0.006639110959238476
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,64,5120,0.015799999237060547
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,64,2560,0.0064604443808396654
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,64,4096,0.014875556031862894
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,64,2048,0.005934222290913264
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,64,3584,0.014462222655614218
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,64,3072,0.013583111266295115
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,64,1536,0.004564444637960858
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,64,1024,0.003605333467324575
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,64,2048,0.013408888545301227
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,64,1536,0.012453333371215396
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,64,768,0.003535110917356279
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,64,512,0.003228444399105178
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,64,1024,0.012132444315486483
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,64,256,0.0028844444702068963
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,64,128,0.0028231110837724474
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,64,768,0.012089778151777057
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,64,512,0.012416000167528788
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,64,64,0.002529777793420686
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,64,256,0.011752888560295105
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,128,6144,0.01686311099264357
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,64,32,0.002530666689078013
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,64,128,0.0107351111041175
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,32,65536,0.024329778220918443
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,32,51200,0.021261332763565913
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,64,64,0.011410666836632622
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,64,32,0.011751111182901593
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,32,16384,0.009143999881214565
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,32,12288,0.009718221922715506
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,32,65536,0.08939111232757568
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,32,10240,0.00868977771864997
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,32,51200,0.07004444466696845
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,32,8192,0.008296888735559251
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,32,16384,0.02849777870708042
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,32,7168,0.007939555578761632
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,32,12288,0.024039111203617517
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,32,6144,0.00850133349498113
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,32,10240,0.020959110723601446
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,32,5120,0.007731555236710443
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,32,8192,0.018370666437678866
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,32,4096,0.007487110793590546
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,32,7168,0.018220444520314533
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,32,3584,0.00693866651919153
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,32,5120,0.015444444285498725
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,64,3072,0.006288888967699475
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,32,2560,0.006018666757477655
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,32,4096,0.014264000786675347
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,32,3584,0.014683556225564746
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,32,2048,0.005596444424655702
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,32,1536,0.0045422220395671
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,32,3072,0.013442666994200813
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,32,1024,0.0036764442920684814
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,64,2560,0.013753777576817406
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,32,2560,0.013424889081054263
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,32,768,0.003532444437344869
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,32,2048,0.013342222405804528
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,32,512,0.003216888962520493
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,32,1536,0.012453333371215396
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,32,256,0.002854222224818336
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,32,1024,0.01204355557759603
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,32,768,0.012128888732857175
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,32,128,0.002516444358560774
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,32,512,0.01221866657336553
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,32,256,0.011187555889288584
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,32,32,0.0025439999169773525
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,32,128,0.011015999648306104
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,32,64,0.011392888923486074
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,32,32,0.01074222226937612
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,113,32,6144,0.01683555543422699
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,32,3072,0.006636444479227066
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,65536,51200,0.6560284296671549
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,65536,16384,0.22011821799808076
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,65536,16384,0.37170134650336367
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,113,32,64,0.002559111143151919
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,65536,51200,1.1432906256781685
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,65536,12288,0.2791528966691759
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,65536,12288,0.1653777758280436
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,65536,10240,0.237373325559828
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,65536,8192,0.19252888361612955
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,65536,8192,0.11831111378139919
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,65536,12288,0.23034932878282335
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,65536,7168,0.17013333903418648
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,65536,10240,0.19663643836975098
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,65536,16384,0.30624267790052623
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,65536,7168,0.10161777999666001
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,65536,10240,0.13937332895067003
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,65536,6144,0.1455271111594306
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,65536,5120,0.12295822302500407
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,65536,8192,0.16043555736541748
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,65536,6144,0.08931733502282037
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,65536,5120,0.07613777452045016
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,65536,4096,0.10159199767642552
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,65536,4096,0.06413688924577501
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,65536,3584,0.08800888723797268
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,65536,7168,0.14372355408138698
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,65536,6144,0.12777511278788248
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,65536,3584,0.05816977553897434
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,65536,3072,0.07644799682829115
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,65536,4096,0.09696000152164036
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,65536,5120,0.1119226614634196
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,65536,2560,0.06395644611782499
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,65536,3584,0.08797511127259995
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,65536,2048,0.051826665798823036
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,65536,3072,0.05139822098943922
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,65536,2560,0.04593777656555176
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,65536,1536,0.04077333211898804
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,65536,2048,0.041159109936820135
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,65536,3072,0.08026844263076782
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,65536,1024,0.02978666623433431
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,65536,1536,0.03388888968361749
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,65536,768,0.022487110561794702
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,65536,1536,0.055664890342288546
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,65536,2048,0.06447377469804552
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,65536,1024,0.04961955547332764
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,65536,512,0.01555999947918786
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,65536,768,0.0448017782635159
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,65536,768,0.024056888288921777
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,65536,512,0.020610666937298246
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,65536,256,0.01036800030204985
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,65536,512,0.0398960014184316
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,65536,128,0.008212444682916006
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,65536,256,0.033781333102120295
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,65536,128,0.02906844351026747
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,65536,64,0.008656889200210571
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,65536,128,0.01790844400723775
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,65536,32,0.008617777791288164
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,65536,64,0.01755199995305803
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,65536,32,0.021831999222437542
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,65536,2560,0.07112266620000203
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,65536,1024,0.028106666273540918
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,51200,65536,0.6830897861056857
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,51200,65536,1.1005502276950412
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,65536,256,0.018876444962289598
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,51200,16384,0.2808951006995307
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,51200,51200,0.5227280192905003
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,51200,51200,0.867561764187283
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,65536,51200,0.9476168950398763
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,51200,12288,0.2133493291007148
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,51200,16384,0.17821510632832846
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,51200,12288,0.13452888859642878
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,51200,10240,0.1136782169342041
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,51200,8192,0.13520088460710314
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,51200,8192,0.09644444121254815
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,51200,7168,0.11733422014448379
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,51200,7168,0.08306222491794162
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,51200,10240,0.16670666800604927
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,51200,16384,0.25446311632792157
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,51200,6144,0.1018257803387112
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,51200,8192,0.14087200164794922
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,51200,12288,0.1965022219551934
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,51200,6144,0.0736151138941447
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,51200,5120,0.08595022228029038
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,51200,10240,0.1662542157702976
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,51200,5120,0.06300533480114408
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,51200,4096,0.07238933112886217
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,51200,3584,0.06214577621883816
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,51200,4096,0.053451554642783276
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,51200,7168,0.12504533926645914
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,51200,6144,0.11198577615949844
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,51200,5120,0.09769244326485528
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,51200,4096,0.08530222045050727
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,51200,3584,0.04888177911440531
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,51200,3584,0.07787377966774835
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,51200,2560,0.0467582212554084
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,51200,3072,0.04351377818319532
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,51200,2048,0.03887733485963609
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,51200,2560,0.03905511233541701
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,51200,3072,0.07191199726528592
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,51200,1536,0.030177778667873804
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,51200,2560,0.06495110856162177
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,51200,2048,0.03548533386654324
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,51200,2048,0.058118224143981934
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,51200,1024,0.023881778120994568
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,51200,1536,0.02990844514634874
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,51200,1536,0.05118311113781399
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,51200,768,0.01719466679626041
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,51200,1024,0.024911999702453613
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,51200,1024,0.04497333367665609
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,51200,512,0.012421333127551608
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,51200,768,0.021577777134047613
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,51200,768,0.04095022214783563
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,51200,256,0.009311999711725447
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,51200,512,0.018639999959203932
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,51200,512,0.036333332459131874
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,51200,128,0.0064560001095136
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,51200,3072,0.05510400070084465
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,51200,256,0.017640888690948486
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,51200,256,0.032264000839657254
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,51200,64,0.005208000126812193
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,51200,32,0.005576000031497743
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,51200,128,0.016164445214801364
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,51200,128,0.026434666580624048
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,51200,64,0.018530666828155518
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,16384,65536,0.33744533856709796
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,51200,32,0.01921422282854716
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,16384,65536,0.27686932351854115
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,16384,51200,0.2630782127380371
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,16384,16384,0.08575377861658733
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,16384,16384,0.0788853300942315
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,16384,51200,0.2146444453133477
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,16384,12288,0.06758577956093682
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,51200,51200,0.812396420372857
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,16384,12288,0.06109955575731066
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,16384,10240,0.056977775361802846
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,16384,16384,0.08836978011661106
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,16384,10240,0.05123644404941135
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,16384,8192,0.04730044470893013
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,16384,12288,0.07231911023457845
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,16384,7168,0.0400622222158644
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,16384,8192,0.04425422350565592
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,16384,10240,0.06587821907467313
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,51200,65536,1.0421173307630751
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,16384,6144,0.035860445764329694
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,16384,7168,0.03980799847178989
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,16384,8192,0.05511555406782362
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,16384,5120,0.030808889203601416
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,16384,7168,0.051048888100518115
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,16384,4096,0.02643111182583703
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,16384,5120,0.03165422214402093
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,16384,6144,0.048009776406817965
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,16384,5120,0.04306044512324863
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,16384,6144,0.03832888934347365
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,16384,3584,0.022945778237448797
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,16384,4096,0.028194665908813477
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,16384,3072,0.02016177773475647
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,16384,51200,0.21795733769734701
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,16384,65536,0.27281689643859863
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,16384,3584,0.026388444834285315
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,16384,2560,0.017478222648302715
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,16384,3072,0.0236799998415841
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,16384,2048,0.0144177774588267
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,16384,3072,0.036093334356943764
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,16384,1536,0.011402666568756104
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,16384,2560,0.033089776833852134
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,16384,2560,0.02125866711139679
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,16384,2048,0.03183555603027344
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,16384,1024,0.009282666775915358
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,16384,2048,0.019912888606389362
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,16384,768,0.007631999750932057
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,16384,1536,0.030826667944590252
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,16384,1536,0.018245332770877414
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,16384,1024,0.02903199858135647
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,16384,1024,0.01643288963370853
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,16384,768,0.015167999598715039
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,16384,768,0.026942221654786006
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,16384,256,0.004311111238267687
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,16384,512,0.02371911042266422
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,16384,512,0.014099554883109199
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,16384,128,0.0038853333228164246
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,16384,256,0.01313244468635983
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,16384,64,0.003839111162556542
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,16384,128,0.019561777512232464
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,16384,128,0.012446222205956778
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,16384,32,0.0038408889538711975
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,16384,64,0.013408000270525614
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,16384,32,0.014120888378885059
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,12288,65536,0.2432924376593696
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,16384,4096,0.03969066672854953
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,12288,65536,0.2241013314988878
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,16384,3584,0.03904533386230469
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,12288,51200,0.18785511122809517
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,12288,51200,0.17447377575768364
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,12288,16384,0.06413333283530341
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,16384,512,0.00620888877246115
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,12288,12288,0.05019111103481717
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,12288,16384,0.06550311379962497
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,16384,256,0.022667555345429316
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,12288,12288,0.05163200034035576
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,12288,10240,0.04259999924235874
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,12288,16384,0.08001422219806247
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,12288,12288,0.06633510854509142
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,12288,8192,0.03569066524505615
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,12288,10240,0.057787557442982994
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,12288,7168,0.030751999881532457
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,12288,8192,0.037696000602510236
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,12288,10240,0.04320889049106174
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,12288,8192,0.05215822325812446
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,12288,7168,0.03411022159788344
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,12288,65536,0.24275554551018608
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,12288,5120,0.023806222611003455
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,12288,7168,0.047600001096725464
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,12288,6144,0.03105777833196852
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,12288,4096,0.020601777566803824
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,12288,6144,0.04475555486149258
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,12288,5120,0.04061422083112929
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,12288,3584,0.017571555243598092
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,12288,4096,0.023411555422676936
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,12288,3072,0.015786666009161208
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,12288,3584,0.02237422267595927
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,12288,3584,0.03606044583850437
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,12288,2560,0.013442666994200813
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,12288,3072,0.020638222495714825
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,12288,3072,0.03471555643611484
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,12288,2048,0.011779555843936073
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,12288,2560,0.019497777024904888
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,12288,2560,0.032928887340757586
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,12288,1536,0.00962577760219574
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,12288,2048,0.018395556343926322
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,12288,2048,0.03087555699878269
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,12288,1024,0.008099555969238281
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,12288,1536,0.029913776450686987
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,12288,1024,0.014444443914625378
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,12288,768,0.006603555546866522
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,12288,6144,0.027173333697848853
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,12288,51200,0.19515911738077799
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,12288,512,0.004924444274769889
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,12288,768,0.013759111364682516
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,12288,768,0.0243484444088406
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,12288,256,0.004535111288229625
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,12288,5120,0.02751111156410641
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,12288,512,0.02314577831162347
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,12288,512,0.013079110946920184
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,12288,128,0.0041644444896115195
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,12288,256,0.02199111051029629
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,12288,64,0.0038408889538711975
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,12288,128,0.019300444258583915
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,12288,32,0.0039057777159743835
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,12288,64,0.012421333127551608
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,12288,32,0.013108444710572561
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,10240,65536,0.20398933357662627
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,12288,1536,0.01681777834892273
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,10240,65536,0.21597511238522002
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,12288,1024,0.027929776244693335
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,10240,51200,0.1567200024922689
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,10240,16384,0.05393244491683113
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,10240,51200,0.16869510544670951
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,12288,4096,0.03727911247147454
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,10240,12288,0.04296355446179708
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,10240,16384,0.06309333112504747
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,12288,256,0.012727110750145383
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,12288,128,0.012402666939629449
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,10240,10240,0.036088890499538846
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,10240,16384,0.07773422532611422
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,10240,12288,0.04969333277808296
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,10240,8192,0.030629333522584703
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,10240,10240,0.04213066564665901
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,10240,12288,0.06451200114356147
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,10240,7168,0.026315554976463318
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,10240,10240,0.05669244130452474
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,10240,6144,0.02328444520632426
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,10240,8192,0.05022933416896396
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,10240,7168,0.033139556646347046
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,10240,51200,0.187645329369439
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,10240,5120,0.020094222492641874
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,10240,7168,0.04623200164900886
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,10240,6144,0.02996888756752014
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,10240,65536,0.23340710004170737
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,10240,4096,0.017329777280489605
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,10240,6144,0.04328622089491951
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,10240,3584,0.014871110518773397
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,10240,5120,0.02591288917594486
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,10240,5120,0.04001599881384108
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,10240,4096,0.02292177743381924
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,10240,3072,0.013450666434235044
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,10240,3584,0.021690666675567627
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,10240,2560,0.011447110937701331
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,10240,3584,0.03513066636191474
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,10240,2048,0.010257778068383535
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,10240,3072,0.02049688829316033
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,10240,2560,0.03277955452601115
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,10240,2560,0.01921333372592926
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,10240,1536,0.008662222160233391
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,10240,2048,0.018114666144053142
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,10240,2048,0.03127377894189622
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,10240,1024,0.0069466663731469055
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,10240,1536,0.01612355477280087
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,10240,1536,0.02951999836497837
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,10240,768,0.005584888988071018
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,10240,1024,0.015107555521859063
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,10240,1024,0.025033776958783466
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,10240,512,0.004538666870858935
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,10240,8192,0.03685155510902405
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,10240,768,0.013927999469969006
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,10240,768,0.02574133376280467
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,10240,256,0.0038399998512532976
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,10240,512,0.013080000049538083
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,10240,512,0.023016000787417095
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,10240,128,0.003547555456558863
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,10240,256,0.02195288903183407
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,10240,256,0.01275644451379776
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,10240,64,0.003556444413132138
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,10240,32,0.0035626664757728577
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,10240,128,0.019567999574873183
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,10240,128,0.012089778151777057
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,10240,64,0.012783110969596438
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,10240,32,0.013071999781661563
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,10240,4096,0.03680000040266249
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,8192,65536,0.1794382201300727
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,8192,51200,0.14244266351064047
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,10240,3072,0.03416000141037835
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,8192,16384,0.048510223627090454
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,8192,65536,0.1708773374557495
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,8192,12288,0.03803022371398078
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,8192,51200,0.13357510831620958
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,8192,16384,0.05298133360015022
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,8192,10240,0.0322106679280599
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,8192,12288,0.041751109891467623
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,8192,8192,0.02743822170628442
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,8192,16384,0.07179111242294312
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,8192,12288,0.06117510795593262
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,8192,7168,0.02383199996418423
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,8192,8192,0.030607110924190942
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,8192,10240,0.05359289050102234
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,8192,6144,0.020855110552575853
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,8192,8192,0.04837422238455879
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,8192,7168,0.02797422144148085
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,8192,7168,0.04438044296370613
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,8192,5120,0.017993777990341187
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,8192,6144,0.0255395554833942
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,8192,51200,0.17396622233920625
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,8192,6144,0.04186311033036974
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,8192,4096,0.01574577722284529
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,8192,3584,0.01407199932469262
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,8192,5120,0.022077333596017625
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,8192,65536,0.21631022294362387
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,8192,5120,0.038613332642449275
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,8192,4096,0.03620533479584588
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,8192,3072,0.01272266689274046
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,8192,4096,0.020576889316240948
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,8192,3584,0.0347324444188012
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,8192,2560,0.011056889262464313
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,8192,3584,0.019324445062213473
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,8192,3072,0.033562666840023465
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,8192,2560,0.01738844480779436
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,8192,2560,0.03163199954562717
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,8192,1536,0.00832711077398724
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,8192,2048,0.016343999240133498
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,8192,2048,0.03050311075316535
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,8192,1024,0.0063475556671619415
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,8192,1536,0.01443199978934394
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,8192,1536,0.02772533396879832
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,8192,768,0.0052693333062860705
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,8192,1024,0.025077333052953083
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,8192,512,0.004537777768241035
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,8192,768,0.012770666844315
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,8192,768,0.024335111180941265
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,8192,10240,0.03529599971241421
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,8192,256,0.0038293335172865125
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,8192,512,0.012448888685968188
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,8192,512,0.023013333479563396
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,8192,128,0.0038319999972979226
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,8192,256,0.02165866725974613
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,8192,256,0.012256888879670037
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,8192,64,0.003555555724435382
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,8192,32,0.0038124442928367188
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,8192,128,0.012039110892348819
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,8192,64,0.012527999778588613
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,8192,32,0.012488889197508493
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,7168,65536,0.16128622161017522
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,7168,51200,0.12827111615075007
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,8192,2048,0.00998222248421775
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,7168,51200,0.132149338722229
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,8192,1024,0.01402666668097178
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,7168,16384,0.05116800136036343
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,7168,65536,0.21359199947781035
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,7168,51200,0.17224533028072783
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,8192,128,0.019606222709019978
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,7168,12288,0.035644445154401995
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,7168,16384,0.07147377729415894
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,7168,12288,0.04083555605676439
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,7168,12288,0.06078844600253635
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,7168,65536,0.16876622041066489
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,7168,10240,0.033952001068327166
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,7168,8192,0.02604977786540985
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,7168,10240,0.05312711000442505
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,7168,7168,0.02237066626548767
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,7168,8192,0.030071109533309937
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,7168,8192,0.04768888817893135
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,7168,6144,0.019447111421161227
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,7168,16384,0.04985688792334663
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,7168,7168,0.027277333868874445
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,7168,7168,0.044234666559431285
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,7168,5120,0.016768889294730294
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,7168,6144,0.02457333273357815
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,7168,6144,0.04200889004601372
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,7168,4096,0.014797333214018079
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,7168,5120,0.03850133220354716
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,7168,3584,0.012081777883900536
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,7168,4096,0.02000977761215634
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,7168,4096,0.03636088967323303
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,7168,3072,0.011222222612963783
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,7168,3584,0.01921688848071628
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,7168,10240,0.029831111431121826
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,7168,3584,0.034196443027920194
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,7168,2560,0.009737778041097853
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,7168,3072,0.033497777250077986
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,7168,3072,0.018592889110247295
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,7168,2048,0.008623999853928884
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,7168,2560,0.017183999220530193
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,7168,1536,0.007592889169851939
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,8192,3072,0.018569777409235638
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,7168,2048,0.03057066599527995
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,7168,1024,0.0058142224119769196
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,7168,1536,0.014422222971916199
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,7168,1536,0.0281057788266076
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,7168,768,0.004929777648713854
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,7168,1024,0.013458666702111563
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,7168,512,0.004517333375083076
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,7168,1024,0.02571644385655721
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,7168,768,0.024380443824662104
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,7168,256,0.004171555654870139
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,7168,512,0.024338665935728285
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,7168,256,0.012040889097584618
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,7168,256,0.022287999590237934
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,7168,128,0.003536888708670934
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,7168,5120,0.021951999929216173
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,7168,64,0.003559111307064692
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,7168,128,0.019242667489581637
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,7168,128,0.012061333490742577
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,7168,32,0.0038702223036024305
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,7168,64,0.01273155543539259
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,7168,32,0.012796444197495779
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,7168,2560,0.03081511126624213
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,6144,65536,0.16240889496273464
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,7168,2048,0.016201777590645682
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,6144,51200,0.10740800036324395
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,6144,16384,0.04361244373851352
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,6144,51200,0.1284631093343099
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,7168,768,0.013067555924256643
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,6144,16384,0.04953866534762912
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,6144,12288,0.035918222533331975
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,6144,12288,0.03883466786808438
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,6144,10240,0.024475556280877855
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,6144,65536,0.2113564411799113
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,6144,12288,0.06003377834955851
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,6144,8192,0.021189333664046392
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,6144,10240,0.03319999906751845
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,6144,10240,0.05288088983959622
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,6144,8192,0.028824888997607764
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,6144,7168,0.018239999810854595
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,6144,8192,0.04732977681689792
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,6144,6144,0.01578044394652049
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,6144,7168,0.02604888876279195
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,6144,7168,0.04389511214362251
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,6144,5120,0.013901333014170328
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,6144,6144,0.02392622166209751
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,6144,6144,0.04083022144105699
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,6144,4096,0.01256622208489312
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,6144,5120,0.021706667211320665
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,6144,5120,0.03779644436306424
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,6144,3584,0.011000889043013254
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,6144,4096,0.020248000820477802
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,6144,4096,0.035616000493367515
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,7168,512,0.012461333639091916
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,6144,3072,0.009858667022652095
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,6144,3584,0.018935999936527677
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,6144,3584,0.03405155407057868
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,6144,2560,0.008967999782827165
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,6144,16384,0.07091199689441256
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,6144,3072,0.033265779415766396
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,6144,2048,0.007937777373525832
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,6144,51200,0.17025778028700086
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,6144,2560,0.030491554074817236
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,6144,1536,0.006584888945023219
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,6144,2048,0.03046222196684943
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,6144,2048,0.015789333317014907
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,6144,1024,0.005201777650250329
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,6144,1536,0.014175999495718213
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,6144,1536,0.027085334062576294
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,6144,768,0.004629333400064045
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,6144,65536,0.13239999612172446
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,6144,1024,0.013418667018413544
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,6144,1024,0.02570044497648875
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,6144,512,0.0042453333735466
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,6144,768,0.012910222013791403
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,6144,768,0.023974221613672044
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,6144,256,0.0035111109415690103
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,6144,512,0.012749333348539142
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,6144,128,0.003181333343187968
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,6144,256,0.02167111138502757
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,6144,256,0.01202755586968528
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,6144,64,0.0032017777363459268
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,6144,128,0.012053333222866058
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,6144,128,0.019536889261669584
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,6144,32,0.003175111073586676
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,6144,64,0.011723555624485016
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,6144,32,0.012161778079138862
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,5120,65536,0.11567466788821751
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,5120,51200,0.09380000167422825
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,6144,3072,0.018198221921920776
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,5120,65536,0.15847467051612005
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,6144,2560,0.01704266667366028
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,5120,16384,0.03801777627733018
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,5120,12288,0.030527111556794908
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,5120,16384,0.047863112555609814
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,5120,51200,0.12521421909332275
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,5120,10240,0.02683199942111969
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,5120,16384,0.07060533099704318
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,5120,12288,0.0373342235883077
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,5120,8192,0.01924977699915568
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,5120,12288,0.05963200330734253
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,6144,512,0.02398666739463806
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,5120,10240,0.03201777736345927
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,5120,65536,0.2096195618311564
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,5120,7168,0.016618667377365958
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,5120,51200,0.16886844899919298
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,5120,6144,0.014696000350846184
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,5120,8192,0.02742044462098016
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,5120,8192,0.04650577902793884
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,5120,5120,0.013028444515334235
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,5120,7168,0.04310311211480034
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,5120,6144,0.0406915545463562
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,5120,4096,0.011362666885058085
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,5120,6144,0.023710222707854375
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,5120,5120,0.0370782216389974
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,5120,3584,0.010261333651012844
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,5120,5120,0.021327111456129286
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,5120,3072,0.00964355551534229
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,5120,4096,0.035078220897250705
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,5120,3584,0.03367288907368978
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,5120,3584,0.01851466629240248
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,5120,2560,0.008571555217107138
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,5120,3072,0.01738222274515364
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,5120,3072,0.032680001523759626
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,5120,2048,0.007621333003044128
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,5120,2560,0.015480000111791821
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,5120,1536,0.006240889016124938
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,5120,2048,0.027387556102540758
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,5120,1536,0.013800889253616333
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,5120,1536,0.02570844524436527
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,5120,1024,0.004932444542646408
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,5120,1024,0.024673778149816725
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,5120,1024,0.013119999733236102
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,5120,768,0.004573333180612988
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,5120,10240,0.051911999781926475
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,5120,512,0.0041759999261962045
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,5120,768,0.012720888687504662
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,5120,7168,0.025407999753952026
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,5120,512,0.022653333014912073
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,5120,256,0.003528000166018804
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,5120,512,0.012423999607563019
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,5120,128,0.003167111012670729
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,5120,256,0.022357333037588332
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,5120,4096,0.019952888290087383
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,5120,256,0.012034667034943899
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,5120,64,0.0031724443866146933
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,5120,128,0.011410666836632622
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,5120,32,0.0035146665241983202
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,5120,128,0.020622221959961783
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,5120,64,0.011750222080283694
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,5120,32,0.012082666986518435
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,5120,2560,0.030185778935750324
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,4096,65536,0.09322310818566217
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,5120,2048,0.014764444695578681
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,4096,51200,0.0768080022599962
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,4096,65536,0.11720089117685954
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,4096,16384,0.0322106679280599
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,4096,12288,0.0258586671617296
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,4096,51200,0.0939520001411438
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,4096,16384,0.03630400035116408
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,4096,16384,0.0706311133172777
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,4096,12288,0.028916445043351915
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,4096,12288,0.05908888578414917
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,4096,8192,0.016238222519556682
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,4096,51200,0.16702044010162354
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,5120,768,0.02367466688156128
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,4096,65536,0.20854932732052275
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,4096,10240,0.05203377869394091
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,4096,7168,0.014863999353514777
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,4096,8192,0.04647199975119697
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,4096,8192,0.022988445229000513
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,4096,7168,0.042352000872294106
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,4096,7168,0.020803555846214294
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,4096,6144,0.01254488858911726
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,4096,5120,0.011740444435013665
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,4096,6144,0.04014666544066535
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,4096,6144,0.01978400018480089
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,4096,5120,0.018245332770877414
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,4096,5120,0.03756711218092177
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,4096,4096,0.010379555324713389
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,4096,3584,0.008961777720186446
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,4096,4096,0.034985777404573225
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,4096,3072,0.008719999757077958
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,4096,3584,0.033950222863091364
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,4096,3072,0.03170933326085409
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,4096,3072,0.014955555399258932
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,4096,2560,0.007480888730949826
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,4096,2560,0.030179556873109605
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,4096,10240,0.02277066641383701
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,4096,2048,0.006628444625271692
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,4096,2048,0.013447110851605734
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,4096,2048,0.027798222170935735
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,4096,1536,0.005385777602593104
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,4096,1536,0.013120888835854001
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,4096,1536,0.025723555021815833
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,4096,1024,0.004495111190610462
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,4096,1024,0.025403555896547105
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,4096,768,0.003887999802827835
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,4096,4096,0.016827555166350473
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,4096,768,0.012544000314341651
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,4096,3584,0.0159582214223014
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,4096,512,0.0035546666218174826
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,4096,768,0.02369155486424764
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,4096,256,0.0035031110876136353
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,4096,512,0.02421866688463423
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,4096,512,0.012092444631788464
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,4096,128,0.003293333368168937
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,4096,256,0.022034666604465906
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,4096,256,0.011696889168686338
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,4096,2560,0.014139556222491793
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,4096,64,0.0031644445326593188
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,4096,128,0.011426666544543372
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,4096,32,0.002995555599530538
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,4096,128,0.019871999820073444
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,4096,64,0.011717333561844297
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,3584,65536,0.08418577909469604
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,4096,32,0.01205244412024816
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,3584,51200,0.0683457785182529
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,3584,65536,0.1141857835981581
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,3584,16384,0.029155555698606703
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,3584,51200,0.09215466843711005
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,3584,12288,0.024209777514139812
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,4096,1024,0.012713777522246042
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,3584,16384,0.03533777925703261
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,3584,16384,0.06972177823384602
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,3584,10240,0.021506667137145996
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,3584,12288,0.028129776318868
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,3584,12288,0.058562669489118785
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,3584,65536,0.2076666620042589
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,3584,8192,0.015048889650238885
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,3584,51200,0.16725422276390922
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,3584,7168,0.013730666703648038
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,3584,10240,0.024706666668256123
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,3584,10240,0.05121244324578179
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,3584,8192,0.021969777014520433
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,3584,6144,0.012094222009181976
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,3584,8192,0.04563555452558729
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,3584,7168,0.042769776450263135
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,3584,5120,0.011018666956159802
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,3584,7168,0.020627554919984605
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,3584,4096,0.009983110758993361
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,3584,6144,0.040291554398006864
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,3584,5120,0.01794399983353085
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,3584,3584,0.008954666554927826
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,3584,5120,0.036743111080593534
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,3584,3072,0.007983999947706858
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,3584,4096,0.034345779154035784
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,3584,4096,0.016185777054892648
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,3584,3584,0.031544887357287936
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,3584,2560,0.007246221933099959
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,3584,3584,0.01511111193233066
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,4096,10240,0.025027554896142747
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,3584,2048,0.0062773335311147906
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,3584,3072,0.032623999648623996
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,3584,2560,0.027798222170935735
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,3584,1536,0.005141333159473208
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,3584,2560,0.014471999473041959
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,3584,1024,0.004519111166397731
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,3584,2048,0.02816533380084568
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,3584,2048,0.013464888764752282
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,3584,1536,0.026407111022207472
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,3584,768,0.0039057777159743835
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,3584,1536,0.013078221844302284
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,3584,512,0.0035173334181308746
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,3584,1024,0.012737777498033313
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,3584,1024,0.02536800007025401
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,3584,768,0.02427911096149021
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,3584,768,0.012432888978057437
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,3584,512,0.023316444622145757
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,3584,512,0.012039999994966718
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,3584,128,0.003160888950030009
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,3584,256,0.011432888607184092
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,3584,256,0.022129777404997084
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,3584,64,0.0028124445428450904
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,3584,128,0.019138667318556044
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,3584,32,0.0028799999919202593
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,3584,64,0.011711111499203576
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,3584,6144,0.019694222344292533
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,3584,32,0.011382222175598145
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,3072,65536,0.07436711258358426
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,3072,51200,0.06105244159698486
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,3072,65536,0.11223110887739395
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,3584,3072,0.014797333214018079
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,3072,51200,0.08985600206587051
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,3072,16384,0.025342222717073228
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,3072,65536,0.20708799362182617
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,3072,16384,0.033760001262029014
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,3072,16384,0.06913510958353679
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,3072,12288,0.021526222427686054
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,3584,256,0.0035626664757728577
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,3072,51200,0.16664444075690374
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,3072,10240,0.018499554859267343
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,3072,8192,0.016647110382715862
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,3072,12288,0.027790221903059218
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,3072,12288,0.05857155720392863
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,3072,10240,0.02432800001568264
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,3072,10240,0.05111644334263272
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,3072,7168,0.014828445182906257
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,3072,6144,0.011811555259757571
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,3072,8192,0.02165511084927453
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,3072,8192,0.04593866732385424
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,3584,128,0.011363555159833698
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,3072,7168,0.020432889461517334
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,3072,6144,0.01890222231547038
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,3072,5120,0.017852443787786696
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,3072,5120,0.03745955559942458
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,3072,4096,0.034972445832358465
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,3072,3584,0.008570666942331526
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,3072,3584,0.01540177729394701
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,3072,3072,0.007838221887747446
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,3072,3072,0.014495111174053617
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,3072,3072,0.03053511182467143
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,3072,2560,0.007110222346252865
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,3072,2560,0.01387288918097814
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,3072,7168,0.04254755708906385
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,3072,2048,0.006246222390068903
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,3072,2560,0.02814133299721612
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,3072,6144,0.039719998836517334
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,3072,4096,0.009639110830095079
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,3072,1536,0.0058204444746176405
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,3072,2048,0.027830223242441814
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,3072,2048,0.013463111387358772
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,3072,1024,0.004535111288229625
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,3072,1536,0.025369778275489807
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,3072,4096,0.015810666812790763
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,3072,1536,0.01276177747382058
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,3072,768,0.0041955556306574075
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,3072,512,0.0038382220599386427
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,3072,1024,0.01278222186697854
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,3072,768,0.023373333944214716
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,3072,768,0.012392000191741519
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,3072,256,0.0035004446076022256
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,3072,512,0.02334844403796726
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,3072,512,0.011887999872366587
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,3072,128,0.0031742221779293488
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,3072,256,0.02161688937081231
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,3072,256,0.011721777419249216
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,3072,64,0.0028293333533737394
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,3072,128,0.011377777490350934
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,3072,128,0.020239111449983384
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,3072,32,0.002871111035346985
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,3072,64,0.011387555963463254
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,2560,65536,0.061478224065568715
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,3072,32,0.011344888971911537
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,2560,51200,0.05211111240916782
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,2560,65536,0.11008710993660821
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,2560,16384,0.02200355629126231
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,2560,51200,0.08751999669604832
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,3072,5120,0.010718222293588849
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,2560,12288,0.018575110369258456
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,2560,16384,0.03251555562019348
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,2560,10240,0.016345777445369296
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,2560,12288,0.027434666951497395
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,2560,65536,0.20744000540839302
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,2560,8192,0.014707555373509726
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,2560,10240,0.023582221733199224
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,2560,10240,0.05121422145101759
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,3072,1024,0.025480000509156123
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,2560,7168,0.013109332985348172
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,2560,8192,0.021225778592957392
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,2560,8192,0.04572000106175741
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,2560,6144,0.01256622208489312
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,2560,7168,0.04241333405176798
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,2560,7168,0.019998222589492798
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,2560,5120,0.010306666294733683
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,2560,6144,0.03975111246109009
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,2560,6144,0.0188719994492001
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,2560,5120,0.017328000730938382
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,2560,5120,0.03707022137112088
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,2560,4096,0.015122666954994202
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,2560,4096,0.033258666594823204
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,2560,3584,0.00832266691658232
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,2560,3584,0.03110044532352024
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,2560,3584,0.014864888456132678
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,2560,3072,0.007553777760929531
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,2560,3072,0.014431110686726041
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,2560,16384,0.06867555777231853
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,2560,2560,0.007275555696752336
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,2560,12288,0.05802488989300198
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,2560,2048,0.005948444621430502
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,2560,2560,0.028134223487642076
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,2560,2048,0.013408000270525614
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,2560,1536,0.004889777965015835
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,3072,3584,0.03156088789304098
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,2560,1536,0.013027555412716336
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,2560,4096,0.00924444446961085
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,2560,1024,0.01239733315176434
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,2560,1024,0.02439022229777442
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,2560,768,0.004184000194072723
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,2560,768,0.012103111379676394
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,2560,3072,0.030254221624798242
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,2560,512,0.003551111039188173
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,2560,51200,0.16663111580742732
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,2560,2560,0.013759999639458127
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,2560,512,0.02370577719476488
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,2560,256,0.003170666595300039
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,2560,2048,0.02808444367514716
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,2560,256,0.020985777179400127
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,2560,128,0.0031759999692440033
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,2560,1536,0.0255422227912479
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,2560,128,0.020411555965741474
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,2560,128,0.011405333048767514
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,2560,64,0.0028479999552170434
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,2560,32,0.0031395554542541504
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,2048,65536,0.052914665804968945
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,2560,64,0.011715555356608497
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,2560,32,0.011724444727102915
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,2048,51200,0.04371644390953911
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,2048,65536,0.1054133309258355
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,2048,51200,0.08529155784183079
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,2048,16384,0.019208888212839764
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,2048,65536,0.2070737812254164
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,2560,768,0.023711111810472276
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,2048,51200,0.16616000069512263
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,2048,12288,0.0159608887301551
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,2048,16384,0.03155288762516446
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,2048,16384,0.06866844495137532
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,2560,512,0.012050666742854647
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,2048,10240,0.013405332962671915
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,2048,8192,0.013414222333166333
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,2048,12288,0.0269822229941686
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,2048,12288,0.05773778094185723
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,2048,10240,0.051233778397242226
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,2048,10240,0.023383999864260357
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,2048,7168,0.01239111108912362
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,2560,256,0.011735999749766456
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,2048,6144,0.01146933353609509
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,2048,8192,0.02074666652414534
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,2048,8192,0.04506399896409777
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,2048,5120,0.01033155537313885
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,2048,7168,0.042484445704354175
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,2048,7168,0.019381332728597853
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,2560,1024,0.004229333251714706
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,2048,6144,0.03843999902407328
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,2048,4096,0.00889511075284746
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,2048,6144,0.018170666363504197
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,2048,3584,0.008051555189821456
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,2048,5120,0.01647733317481147
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,2048,5120,0.0351493325498369
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,2048,3072,0.0074826669361856245
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,2048,4096,0.03257866700490316
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,2048,4096,0.014831110835075378
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,2048,3584,0.031354665756225586
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,2048,3584,0.014783999986118741
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,2048,2048,0.005585777676767773
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,2048,3072,0.03009422289000617
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,2048,3072,0.013935999737845527
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,2048,1536,0.004585777719815572
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,2048,2560,0.027294221851560805
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,2048,2560,0.013745778136783175
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,2048,1024,0.004249777644872665
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,2048,2048,0.013403555585278405
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,2048,2048,0.027087999714745417
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,2048,768,0.0038364442686239877
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,2048,1536,0.025762667258580525
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,2048,512,0.0035208890007601846
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,2048,1024,0.01241422196229299
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,2048,768,0.02404888967672984
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,2048,768,0.012433778080675336
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,2048,256,0.003206222214632564
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,2048,512,0.011946666571829053
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,2048,512,0.022618666291236877
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,2048,128,0.0028684443483750024
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,2048,256,0.011729777687125735
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,2048,256,0.022015111313925848
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,2048,64,0.0028728888266616394
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,2048,32,0.0028524444335036804
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,2048,128,0.011422221859296164
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,2048,64,0.011769777370823754
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,1536,65536,0.04298488961325752
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,2048,32,0.012123555772834353
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,1536,65536,0.1035004456837972
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,1536,51200,0.03479289015134176
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,2048,2560,0.006476444502671559
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,1536,65536,0.20695200231340197
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,1536,51200,0.08280799786249797
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,2048,1536,0.01277511070171992
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,1536,51200,0.1655422184202406
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,1536,16384,0.031209776798884075
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,2048,1024,0.024692444337738886
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,1536,12288,0.013962666193644205
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,1536,10240,0.012787555654843649
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,1536,16384,0.0684915582338969
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,1536,12288,0.026670222481091816
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,1536,12288,0.05738400088416206
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,1536,8192,0.011499555574523078
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,1536,10240,0.022630222969584998
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,1536,10240,0.05048977666431003
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,1536,7168,0.01107377807299296
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,2048,128,0.019398222366968792
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,1536,8192,0.020233778489960563
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,1536,8192,0.04531733194986979
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,1536,6144,0.010281778044170803
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,1536,5120,0.00965244405799442
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,1536,7168,0.041013333532545306
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,1536,7168,0.018903111418088276
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,1536,4096,0.008368888662921058
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,1536,6144,0.037696888049443565
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,1536,6144,0.017472000585661996
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,1536,3584,0.007423111134105259
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,1536,5120,0.03456977672047085
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,1536,5120,0.016161777906947665
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,1536,3072,0.00675999994079272
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,1536,4096,0.014827556080288358
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,1536,4096,0.03240799903869629
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,1536,2560,0.005873777800136142
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,1536,3584,0.014440889159838358
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,1536,3072,0.03015111221207513
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,1536,2048,0.005255110975768831
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,1536,3072,0.014144000079896716
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,1536,2560,0.013456000222100152
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,1536,1536,0.004869333157936732
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,1536,16384,0.014912888407707214
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,1536,2048,0.02684088879161411
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,1536,1024,0.0042151109211974675
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,1536,2048,0.013120888835854001
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,1536,1536,0.026428444517983332
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,1536,1536,0.012735111018021902
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,1536,1024,0.012124444047609964
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,1536,512,0.0035004446076022256
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,1536,768,0.012366222010718452
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,1536,512,0.012044444680213928
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,1536,256,0.0031724443866146933
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,1536,256,0.011696000066068439
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,1536,256,0.021299555897712708
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,1536,128,0.0031662223239739737
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,1536,128,0.011360888679822287
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,1536,2560,0.02812444501452976
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,1536,128,0.019336000084877014
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,1536,64,0.002867555452717675
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,1536,32,0.0031431110368834603
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,1536,768,0.003858666867017746
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,1536,64,0.011178666518794166
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,1024,65536,0.03188088867399428
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,1536,32,0.011076444553004371
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,1536,768,0.02401422295305464
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,1024,51200,0.02492888934082455
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,1024,65536,0.1000231107076009
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,1536,512,0.023715555667877197
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,1024,16384,0.013047999805874295
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,1024,51200,0.0797920028368632
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,1024,65536,0.20727645026312935
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,1024,51200,0.1659297810660468
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,1024,16384,0.06821155548095703
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,1024,10240,0.01254666679435306
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,1024,12288,0.02608888844648997
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,1024,10240,0.021948445174429152
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,1024,10240,0.05034133460786608
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,1024,8192,0.011409777734014722
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,1536,3584,0.03094044327735901
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,1024,8192,0.01926399932967292
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,1024,7168,0.01071999967098236
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,1024,8192,0.043531556924184166
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,1024,6144,0.010594666832023196
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,1024,7168,0.040031999349594116
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,1024,7168,0.0185253338681327
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,1024,5120,0.009679111341635386
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,1536,1024,0.02475999957985348
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,1024,6144,0.037316444847318865
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,1024,4096,0.008056888977686564
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,1024,5120,0.015876443849669564
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,1024,5120,0.034421334664026894
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,1024,3584,0.007178666690985362
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,1024,4096,0.03219555483924018
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,1024,12288,0.014139556222491793
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,1024,3072,0.006587555425034628
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,1024,3584,0.014767999450365702
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,1024,3584,0.030566222137875024
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,1024,16384,0.03105866577890184
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,1024,2560,0.005902222047249476
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,1024,12288,0.05651999844445122
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,1024,3072,0.014107555150985718
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,1024,2048,0.005589333259397083
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,1024,2560,0.013471999930010902
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,1024,2560,0.02806666824552748
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,1024,1536,0.004554666578769684
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,1024,2048,0.013136000268989138
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,1024,1536,0.012755555411179861
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,1024,1536,0.025360888904995386
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,1024,1024,0.004230222354332606
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,1024,1024,0.024004444479942322
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,1024,6144,0.017270222306251526
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,1024,1024,0.01219377749496036
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,1024,768,0.003839111162556542
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,1024,512,0.0034977777136696708
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,1024,768,0.024004444479942322
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,1024,512,0.011732444167137146
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,1024,256,0.003198222153716617
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,1024,512,0.022635555929607813
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,1024,4096,0.014783999986118741
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,1024,128,0.00315022220214208
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,1024,256,0.011407111254003314
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,1024,256,0.020925333102544148
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,1024,64,0.0028880000528362063
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,1024,128,0.01108444482088089
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,1024,128,0.018858666221300762
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,1024,32,0.0031617778456873367
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,1024,3072,0.03016977839999729
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,768,65536,0.027165333429972332
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,1024,64,0.011355555719799466
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,768,51200,0.022737777895397607
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,1024,2048,0.027356444133652583
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,768,65536,0.0935973326365153
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,768,16384,0.01387644476360745
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,768,65536,0.20619732803768584
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,768,51200,0.16657422648535833
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,768,12288,0.012467555701732635
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,768,16384,0.03038311004638672
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,768,16384,0.06735733482572767
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,768,10240,0.011379555695586734
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,768,12288,0.05624533361858792
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,768,12288,0.02475822303030226
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,768,8192,0.01033155537313885
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,768,10240,0.04864177770084805
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,768,7168,0.009368889033794403
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,1024,768,0.01204711116022534
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,768,8192,0.019327110714382596
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,768,8192,0.04316444529427422
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,768,6144,0.008302222523424361
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,768,7168,0.039423998859193586
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,768,5120,0.00795022232664956
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,768,6144,0.03766399953100417
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,768,5120,0.015857777661747403
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,768,5120,0.034930666287740074
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,768,4096,0.007763555480374231
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,1024,32,0.011039111349317761
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,768,4096,0.01513066722287072
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,768,3584,0.006924444602595435
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,768,51200,0.07790578073925443
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,768,3584,0.014492443866199918
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,768,3072,0.00657155571712388
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,768,3072,0.029806223180558946
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,768,3072,0.014159111513031853
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,768,2560,0.005886222339338726
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,768,10240,0.02193333374129401
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,768,2560,0.013791999883121915
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,768,2048,0.0052888890107472735
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,768,2048,0.027460444304678176
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,768,2048,0.013062222136391534
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,768,1536,0.004654222064548069
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,768,6144,0.017159110969967313
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,768,1024,0.0038951109680864546
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,768,1536,0.012793777717484368
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,768,1024,0.02421244482199351
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,768,1024,0.012341332932313284
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,768,768,0.0037768888804647657
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,768,4096,0.03193511234389411
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,768,512,0.0035013332962989807
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,768,768,0.023020444644822016
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,768,768,0.012048888537618848
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,768,256,0.0031822222388452957
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,768,3584,0.030844443374209937
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,768,512,0.022996443841192458
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,768,512,0.011770666473441653
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,768,128,0.0028808888875775864
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,768,256,0.011415999796655444
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,768,64,0.0028159999185138275
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,768,128,0.019215111931165058
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,768,32,0.0028275555620590844
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,768,64,0.011085333095656501
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,768,2560,0.02786933382352193
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,512,65536,0.021016889148288306
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,768,32,0.011386666860845355
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,512,51200,0.01664622293578254
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,768,7168,0.018561777141359117
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,512,65536,0.09603910975986057
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,512,16384,0.011012444065676795
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,512,65536,0.2061377763748169
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,512,51200,0.07562666469150119
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,768,1536,0.02641333308484819
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,512,12288,0.009673777553770278
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,512,51200,0.16590578026241726
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,512,16384,0.029116445117526587
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,512,16384,0.06611733304129706
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,512,10240,0.010034666293197209
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,512,12288,0.024339555038346186
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,512,8192,0.008903111020723978
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,512,12288,0.055213332176208496
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,512,10240,0.021390222840838965
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,512,7168,0.009631111390060848
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,512,8192,0.04348088966475593
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,512,8192,0.019333332777023315
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,512,6144,0.00867733359336853
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,512,7168,0.017856889300876193
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,512,7168,0.04008177916208903
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,768,256,0.020948444803555805
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,512,5120,0.008003555238246918
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,512,6144,0.017183999220530193
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,768,128,0.011368888947698804
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,512,4096,0.007368889119890001
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,512,5120,0.01551555593808492
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,512,5120,0.03461600012249417
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,512,3584,0.0069884442620807225
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,512,4096,0.014615999327765571
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,512,4096,0.03294310967127482
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,512,3072,0.006240889016124938
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,512,3584,0.03051555487844679
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,512,3584,0.014478221535682678
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,512,2560,0.005614222337802251
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,512,3072,0.029763556189007227
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,512,3072,0.014112888111008538
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,512,2048,0.005223999834722943
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,512,1536,0.004579555657174853
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,512,2560,0.02851466668976678
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,512,2560,0.01328888866636488
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,512,1024,0.003903999924659729
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,512,2048,0.027792887555228338
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,512,2048,0.012785777449607849
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,512,768,0.0035075553589397003
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,512,1536,0.025736888249715168
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,512,1024,0.025241777300834656
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,512,1024,0.012090666426552666
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,512,512,0.0031644445326593188
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,512,768,0.012050666742854647
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,512,768,0.025047111842367385
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,512,10240,0.04850044515397814
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,512,512,0.011752000285519494
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,512,512,0.02337155573897892
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,512,128,0.0028648889727062653
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,512,256,0.020960888928837244
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,512,64,0.002528888897763358
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,512,128,0.018627555833922494
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,512,128,0.011711111499203576
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,512,32,0.0028515555378463534
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,256,65536,0.016568000117937725
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,512,64,0.011083555718262991
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,512,6144,0.036983112494150795
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,512,32,0.012051555845472546
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,256,51200,0.018631999691327412
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,256,65536,0.09321777688132392
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,256,16384,0.010033778018421596
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,256,51200,0.07314933008617826
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,256,65536,0.20555467075771758
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,256,12288,0.01035911093155543
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,256,16384,0.028460443019866943
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,256,16384,0.06555022133721246
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,256,10240,0.009356444080670675
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,256,12288,0.02400711178779602
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,512,1536,0.012737777498033313
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,256,12288,0.05433244506518046
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,256,8192,0.00832266691658232
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,256,10240,0.02145066691769494
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,256,7168,0.007948444121413762
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,256,8192,0.018753778603341844
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,256,8192,0.04308977723121643
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,512,256,0.0032151111712058387
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,256,6144,0.008959111240175035
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,256,7168,0.018208889497650992
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,256,7168,0.03940444522433811
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,512,256,0.011745777395036487
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,256,6144,0.016846223009957206
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,256,6144,0.0373306671778361
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,256,4096,0.007306666837798224
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,256,5120,0.034607112407684326
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,256,5120,0.015800888339678448
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,256,3584,0.0069520001610120135
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,256,4096,0.014850666125615438
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,256,4096,0.031854222218195595
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,256,3072,0.006554666492674086
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,256,3584,0.014510222607188754
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,256,3584,0.03143111202451918
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,256,2560,0.005551110953092575
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,256,3072,0.013787555197874704
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,256,3072,0.029839999145931665
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,256,2048,0.005211555709441503
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,256,51200,0.16517778237660727
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,256,2560,0.013791110780504016
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,256,1536,0.004522666749027041
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,256,2048,0.013106666505336761
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,256,2048,0.026906667484177485
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,256,1024,0.003863111138343811
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,256,1536,0.013096888860066732
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,256,1536,0.025024889243973628
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,256,768,0.0035626664757728577
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,256,1024,0.012225777738624148
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,256,10240,0.04822311136457655
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,256,1024,0.024830222129821777
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,256,512,0.0032346666687064697
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,256,768,0.011799111134476133
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,256,768,0.023357333408461675
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,256,256,0.0031351111829280853
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,256,512,0.012054222325483957
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,256,128,0.002862222285734283
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,256,256,0.02092444399992625
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,256,256,0.011065777805116443
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,256,5120,0.007807999849319458
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,256,64,0.002826666666401757
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,256,32,0.0024906665914588505
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,256,128,0.011768889096048145
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,128,65536,0.015303111738628812
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,256,64,0.01089511149459415
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,256,32,0.011031111081441244
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,128,51200,0.01309511148267322
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,128,65536,0.09100177552964951
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,128,65536,0.2056008842256334
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,128,51200,0.07123021947013007
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,256,2560,0.02780533168050978
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,128,51200,0.16509955459170872
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,128,16384,0.028304888142479792
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,128,12288,0.009679999616410997
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,128,12288,0.05468089050716824
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,128,12288,0.0239955551094479
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,128,10240,0.009062222308582729
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,256,512,0.02230577833122677
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,128,10240,0.021197333931922913
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,128,10240,0.0481315553188324
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,128,8192,0.00812977800766627
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,128,7168,0.008113777471913232
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,256,128,0.018868444694413077
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,128,8192,0.01887999971707662
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,128,8192,0.043474667602115206
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,128,6144,0.007262222468852997
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,128,7168,0.017895999881956313
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,128,5120,0.0069671107663048645
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,128,7168,0.03906222184499105
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,128,6144,0.017183999220530193
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,128,6144,0.036728888750076294
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,128,4096,0.007286222444640265
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,128,5120,0.015527110960748462
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,128,5120,0.03391199972894456
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,128,3584,0.006974221931563483
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,128,4096,0.014441778262456259
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,128,4096,0.03256977929009332
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,128,16384,0.009703999592198266
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,128,3072,0.006584888945023219
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,128,2560,0.006252444452709622
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,128,3584,0.030603554513719346
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,128,3072,0.02928000026279026
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,128,3072,0.014223999447292753
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,128,16384,0.06562755505243938
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,128,2048,0.006213333457708359
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,128,1536,0.004511111312442356
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,128,2560,0.01311555587583118
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,128,2560,0.02776266634464264
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,128,1024,0.0038559999730851916
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,128,2048,0.027453333139419556
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,128,2048,0.013442666994200813
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,128,768,0.003506666670242945
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,128,1536,0.025469332933425903
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,128,1024,0.023982221881548565
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,128,1024,0.012103111379676394
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,128,768,0.012379555238617791
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,128,256,0.002854222224818336
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,128,512,0.011704888608720569
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,128,256,0.011727111207114326
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,128,256,0.02091911103990343
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,128,128,0.0028159999185138275
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,128,128,0.019920888874265883
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,128,128,0.011045333411958484
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,128,64,0.0028453332682450614
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,128,32,0.002504000026318762
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,128,64,0.011003555523024665
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,64,65536,0.014764444695578681
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,128,32,0.011730666789743634
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,64,51200,0.014025777578353882
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,128,3584,0.014089778065681458
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,64,16384,0.008632000121805403
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,64,65536,0.0902364452679952
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,64,12288,0.008283555507659912
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,64,51200,0.07090489069620769
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,64,10240,0.007634667058785756
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,128,1536,0.012445333103338877
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,64,8192,0.006924444602595435
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,128,512,0.003220444545149803
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,64,12288,0.024002666274706524
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,64,10240,0.0214373336897956
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,64,6144,0.006672888994216919
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,128,768,0.024008888337347243
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,64,5120,0.006248000181383557
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,64,8192,0.018568888306617737
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,112,128,512,0.022639999787012737
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,64,7168,0.017847999930381775
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,64,4096,0.0062773335311147906
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,64,3584,0.006258666515350342
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,64,6144,0.01719555589887831
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,64,5120,0.015800888339678448
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,64,3072,0.005746666755941179
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,64,2560,0.006264888991912206
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,64,4096,0.01444533301724328
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,64,2048,0.005936000082227919
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,64,3584,0.014074666632546319
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,64,1536,0.004252444538805219
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,64,1024,0.0038559999730851916
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,64,2560,0.013189333180586496
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,64,768,0.0035004446076022256
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,64,2048,0.01274311128589842
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,64,1536,0.01239466667175293
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,64,512,0.0032133333798911837
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,64,256,0.0028239999794297745
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,64,1024,0.0123831108212471
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,64,128,0.0028577778074476454
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,64,512,0.011391999820868174
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,64,64,0.002522666628162066
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,64,128,0.011370666325092316
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,64,32,0.0024871110088295406
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,64,64,0.010716444088353051
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,32,65536,0.014129777749379476
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,64,32,0.011727111207114326
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,64,16384,0.028112000889248315
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,32,51200,0.013624889155228933
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,32,16384,0.00867022242810991
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,64,7168,0.0069146665434042616
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,32,65536,0.08955466747283936
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,32,12288,0.008119111259778341
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,32,51200,0.06958488623301189
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,32,10240,0.007602666815121968
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,32,16384,0.028425776296191748
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,32,8192,0.007080000307824876
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,32,7168,0.006640888750553131
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,32,12288,0.0236453331179089
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,32,6144,0.006177777631415262
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,32,10240,0.02092622220516205
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,32,8192,0.019229332605997723
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,32,7168,0.017903111047214933
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,64,3072,0.014146667387750415
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,32,4096,0.006597333484225803
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,32,6144,0.01647200021478865
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,32,3584,0.006249777972698212
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,32,5120,0.015805333852767944
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,32,3072,0.006284444282452266
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,32,2560,0.005936000082227919
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,32,4096,0.014845333165592618
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,32,3584,0.013971555564138623
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,64,768,0.011753777662913004
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,32,2048,0.005935110979610019
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,32,3072,0.014103111293580798
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,32,2560,0.013408000270525614
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,64,256,0.011155555645624796
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,32,2048,0.012772444221708508
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,32,768,0.003551111039188173
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,32,1536,0.013048888908492194
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,32,512,0.0031999999450312722
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,32,256,0.0028373334142896864
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,32,1024,0.012406222522258759
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,32,128,0.002809777855873108
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,32,768,0.011728000309732227
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,32,64,0.0028088889602157804
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,32,512,0.012096000214417776
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,32,32,0.002550222186578645
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,32,256,0.011139555937714048
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,32,128,0.011360000405046674
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,32,64,0.0107342220014996
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,112,32,32,0.011724444727102915
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,32,5120,0.005965333431959152
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,65536,16384,0.2191235621770223
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,65536,16384,0.37333422236972386
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,65536,12288,0.2865804566277398
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,65536,10240,0.2103066709306505
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,65536,51200,0.6426400078667535
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,65536,12288,0.16148355272081164
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,32,1536,0.0045422220395671
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,112,32,1024,0.0038906666967603895
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,65536,8192,0.17461866802639434
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,65536,7168,0.15199732780456543
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,65536,7168,0.10044355524910821
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,65536,10240,0.13762311140696207
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,65536,51200,1.1409289042154949
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,65536,5120,0.11000177595350479
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,65536,4096,0.09011555380291408
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,65536,5120,0.07546844747331408
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,65536,3584,0.07950133085250854
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,65536,6144,0.08828977743784587
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,65536,3584,0.05766666597790188
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,65536,2560,0.05853333075841268
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,65536,3072,0.06951289044486152
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,65536,3072,0.05138311121198866
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,65536,2048,0.04861066738764445
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,65536,2560,0.04602400130695767
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,65536,1536,0.037407110134760536
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,65536,1024,0.02914666798379686
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,65536,2048,0.040772444672054715
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,65536,1536,0.03363022208213806
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,65536,1024,0.03365866674317254
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,65536,512,0.01477599971824222
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,65536,768,0.02808711263868544
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,65536,256,0.009341333475377824
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,65536,512,0.022293332550260756
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,65536,6144,0.13000088267856175
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,65536,128,0.008284444610277811
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,65536,256,0.0191928893327713
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,65536,64,0.005948444621430502
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,65536,32,0.006225777582989798
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,65536,128,0.017909333109855652
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,65536,64,0.017536888519922893
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,65536,32,0.01938311093383365
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,65536,4096,0.06355022059546576
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,65536,768,0.021451556020312842
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,51200,65536,0.6724168989393445
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,51200,16384,0.28099200460645885
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,65536,8192,0.11742311053805882
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,51200,51200,0.8668515417310926
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,51200,51200,0.5123448901706272
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,51200,65536,1.1051653756035698
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,51200,16384,0.17580089304182264
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,51200,12288,0.2115866608089871
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,51200,10240,0.19507111443413627
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,51200,12288,0.13127466042836508
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,51200,10240,0.1117111047108968
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,51200,8192,0.0958942241138882
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,51200,7168,0.14018400510152182
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,51200,6144,0.12085155646006267
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,51200,5120,0.1017928918202718
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,51200,4096,0.08237066533830431
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,51200,3584,0.07280977567036946
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,51200,7168,0.08228266901440091
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,51200,5120,0.06219910913043552
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,51200,4096,0.05329422156016032
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,51200,6144,0.07295822434955172
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,51200,3584,0.048635555638207324
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,51200,2048,0.04375911090109083
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,51200,3072,0.043304890394210815
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,51200,1536,0.03378044565518697
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,51200,2560,0.053082668119006686
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,51200,1024,0.024707555770874023
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,51200,1536,0.029666665527555678
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,51200,768,0.019024888674418133
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,51200,512,0.013831111292044321
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,51200,1024,0.029651555750105116
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,51200,768,0.02422222163942125
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,51200,256,0.008712000317043727
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,51200,128,0.0058604445722368025
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,51200,512,0.019759999381171334
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,51200,8192,0.1591448916329278
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,51200,64,0.0052168890833854675
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,51200,256,0.01752355529202355
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,51200,32,0.0052586665583981415
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,51200,128,0.016136889656384785
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,51200,32,0.017789334058761597
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,16384,65536,0.3355768786536322
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,51200,3072,0.0639680027961731
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,16384,65536,0.270668453640408
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,51200,64,0.01889600025282966
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,16384,16384,0.08732622199588352
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,16384,51200,0.26172977023654515
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,16384,12288,0.06786844465467665
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,16384,10240,0.05593599875768026
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,16384,16384,0.07622577746709187
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,16384,51200,0.20873688326941597
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,16384,12288,0.05749333567089505
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,51200,2048,0.035014222065607704
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,16384,7168,0.04114044374889798
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,16384,10240,0.05046400096681383
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,16384,5120,0.030757334497239854
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,51200,2560,0.03905422157711453
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,16384,7168,0.03911644551489089
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,16384,8192,0.044623110029432506
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,16384,4096,0.026345777842733595
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,16384,6144,0.03537066777547201
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,16384,3584,0.02256177696916792
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,16384,3072,0.019893333315849304
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,16384,5120,0.03150755498144362
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,16384,2560,0.016857778032620747
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,16384,4096,0.026919111609458923
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,16384,2048,0.01408088869518704
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,16384,3584,0.025384000606007043
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,16384,1536,0.01145600030819575
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,16384,3072,0.023246222072177466
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,16384,1024,0.009210666848553551
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,16384,2560,0.021558221843507554
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,16384,2048,0.01977155605951945
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,16384,1536,0.018236445056067575
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,16384,512,0.0058906666106647914
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,16384,1024,0.01794399983353085
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,16384,256,0.0041848888827694785
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,16384,128,0.003839111162556542
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,16384,512,0.01464355488618215
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,16384,256,0.01311911145846049
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,16384,64,0.0031964443624019623
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,16384,32,0.0035182221068276297
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,16384,64,0.012746666868527731
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,16384,8192,0.048152890470292836
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,16384,32,0.012944888737466602
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,16384,6144,0.035565333233939275
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,12288,65536,0.24560978677537706
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,12288,65536,0.21704888343811035
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,12288,51200,0.1875128878487481
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,12288,16384,0.06447111235724555
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,16384,768,0.0074133334888352295
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,12288,12288,0.05018577641910977
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,12288,51200,0.16881867249806723
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,12288,10240,0.0422417786386278
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,12288,8192,0.036044445302751325
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,12288,16384,0.06397510899437799
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,16384,768,0.016169778174824186
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,12288,12288,0.04792355497678121
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,12288,7168,0.03118488854832119
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,12288,5120,0.02401155564520094
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,12288,6144,0.02730400032467312
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,16384,128,0.012777778009573618
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,12288,8192,0.03775022096104092
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,12288,7168,0.03351644343800015
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,12288,10240,0.042436444097095065
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,12288,4096,0.019876443677478366
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,12288,3584,0.017839110559887357
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,12288,6144,0.030597332451078627
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,12288,3072,0.01573244399494595
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,12288,5120,0.025938666529125635
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,12288,2048,0.0120319997270902
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,12288,4096,0.023022222850057814
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,12288,1536,0.009764444496896531
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,12288,2560,0.013737777868906656
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,12288,3584,0.0221742226017846
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,12288,1024,0.008268444074524773
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,12288,3072,0.020607110526826646
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,12288,2560,0.01956888867749108
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,12288,768,0.0069120000633928515
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,12288,512,0.005197333378924264
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,12288,2048,0.018212444252438016
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,12288,256,0.004562666846646203
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,12288,1536,0.016913778252071805
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,12288,1024,0.015525332755512662
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,12288,64,0.0035573335157500375
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,12288,768,0.014783110883500842
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,12288,512,0.01369866645998425
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,12288,32,0.0038702223036024305
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,12288,256,0.012727110750145383
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,12288,128,0.01276266657643848
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,12288,64,0.012443555725945367
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,12288,32,0.012509333590666452
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,10240,16384,0.054641776614718966
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,10240,65536,0.2070124414232042
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,10240,51200,0.15773155954149035
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,10240,12288,0.042781333128611244
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,10240,10240,0.03585422370168898
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,10240,65536,0.20921777354346383
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,10240,16384,0.06135911411709256
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,10240,8192,0.03050044510099623
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,10240,7168,0.026719111535284255
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,10240,6144,0.023473777704768713
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,10240,10240,0.04111999935574002
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,10240,8192,0.036229332288106285
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,10240,7168,0.032163557079103254
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,10240,6144,0.029402666621738013
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,10240,4096,0.01772799922360314
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,10240,5120,0.02565244502491421
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,10240,3584,0.015593777100245157
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,10240,3072,0.013516444298956128
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,10240,4096,0.022639999787012737
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,10240,2560,0.011968889170222811
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,10240,3584,0.02162666618824005
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,10240,2048,0.01054222219520145
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,10240,3072,0.02051555613676707
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,10240,1536,0.008623110751310984
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,10240,2560,0.019104000594880845
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,12288,128,0.004176889028814104
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,10240,1024,0.007139555282062954
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,10240,2048,0.017823111679818895
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,10240,768,0.005879111174080107
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,10240,512,0.0046302220887608
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,10240,1536,0.016146666473812528
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,10240,256,0.0039057777159743835
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,10240,1024,0.01481244464715322
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,10240,768,0.01444355481200748
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,10240,128,0.003552888830502828
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,10240,64,0.003519111209445529
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,10240,512,0.013134222063753339
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,10240,32,0.003552000141806073
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,10240,256,0.012712889247470431
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,10240,128,0.012087999946541257
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,10240,51200,0.16342133945888943
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,10240,64,0.01239466667175293
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,10240,32,0.012402666939629449
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,10240,12288,0.046718223227394946
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,8192,65536,0.1838853359222412
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,8192,16384,0.050253334972593516
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,8192,51200,0.14194666014777288
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,8192,65536,0.16706577936808267
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,8192,12288,0.03963022099600898
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,8192,51200,0.12969777319166395
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,8192,16384,0.050103111399544605
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,8192,10240,0.0329422222243415
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,8192,8192,0.028706666496064927
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,8192,12288,0.03867644402715895
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,8192,10240,0.03422933485772874
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,8192,6144,0.021634666456116572
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,8192,7168,0.02439466615517934
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,8192,5120,0.018626666731304593
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,8192,8192,0.030329777134789362
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,8192,7168,0.02695200012789832
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,8192,4096,0.015948444604873657
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,8192,3584,0.014081777797804939
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,8192,6144,0.024339555038346186
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,8192,3072,0.012724444270133972
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,8192,4096,0.020241777102152508
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,8192,5120,0.02198311189810435
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,8192,3584,0.01923644377125634
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,8192,2048,0.010025777750545079
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,8192,1536,0.00829777783817715
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,8192,3072,0.018191999859280057
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,8192,1024,0.006544888847404056
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,8192,2560,0.01744888888465034
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,8192,2048,0.015895111693276297
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,8192,768,0.005215999980767568
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,8192,1536,0.01482222146458096
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,8192,512,0.004555555681387584
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,8192,256,0.003859555555714501
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,8192,1024,0.01442577772670322
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,8192,768,0.013811555173661975
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,8192,512,0.013188444077968597
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,8192,256,0.012121777567598553
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,8192,64,0.003216888962520493
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,8192,32,0.0035377778112888336
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,8192,128,0.011776888536082374
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,10240,5120,0.020558221472634208
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,8192,64,0.011720889144473605
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,8192,32,0.012560000022252401
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,7168,65536,0.16208799680074057
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,7168,51200,0.1282106637954712
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,7168,16384,0.04750577939881218
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,7168,65536,0.1632888846927219
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,7168,12288,0.03746755586730109
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,7168,51200,0.1268435584174262
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,7168,10240,0.03142755561404758
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,7168,16384,0.04931288957595825
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,7168,8192,0.02693155573474036
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,7168,12288,0.03738044367896186
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,7168,7168,0.023564444647894964
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,8192,2560,0.011009777585665384
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,7168,10240,0.0332897769080268
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,7168,6144,0.020572443803151447
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,7168,8192,0.02957333458794488
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,7168,5120,0.01774577796459198
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,7168,7168,0.02643377747800615
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,7168,3584,0.012196444802814059
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,7168,4096,0.01533422205183241
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,7168,5120,0.021719111336602107
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,7168,6144,0.023844444089465674
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,7168,4096,0.020261334048377145
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,7168,2560,0.00977600034740236
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,7168,3584,0.019161777363883126
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,7168,2048,0.008707555631796518
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,8192,128,0.0034826666944556763
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,7168,1536,0.00793333351612091
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,7168,3072,0.018094221750895183
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,7168,1024,0.0058871110280354815
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,7168,2560,0.017321777012613084
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,7168,768,0.005220444252093633
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,7168,512,0.004575110971927643
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,7168,1536,0.01441333360142178
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,7168,1024,0.01443199978934394
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,7168,256,0.003930666794379552
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,7168,128,0.0038382220599386427
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,7168,512,0.012857777376969656
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,7168,64,0.0031511110977994073
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,7168,256,0.01221155540810691
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,7168,128,0.011731555892361535
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,7168,32,0.003160888950030009
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,7168,64,0.012725333372751871
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,7168,32,0.012400888734393649
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,6144,65536,0.14345867104000515
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,6144,51200,0.1145342191060384
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,6144,65536,0.15690133306715223
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,6144,16384,0.04376799861590067
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,6144,51200,0.12247733275095622
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,6144,12288,0.0366284449895223
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,7168,3072,0.011749332977665795
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,6144,16384,0.04816533459557427
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,6144,12288,0.036327110396491155
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,6144,8192,0.021574222379260596
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,6144,7168,0.018611555298169453
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,6144,10240,0.03228977653715346
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,6144,6144,0.016622222132152982
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,6144,8192,0.028753777345021565
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,6144,5120,0.014477334088749357
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,6144,7168,0.025421332981851365
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,6144,4096,0.013153778182135688
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,7168,2048,0.015528000063366361
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,6144,3584,0.011789333489206104
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,6144,6144,0.023364444573720295
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,6144,3072,0.010667555862002902
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,6144,5120,0.02160266704029507
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,7168,768,0.014150222142537435
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,6144,4096,0.019567999574873183
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,6144,2560,0.009564444422721863
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,6144,3584,0.018929777873886954
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,6144,2048,0.0086666668454806
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,6144,3072,0.017882666654056974
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,6144,1536,0.007246221933099959
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,6144,1024,0.005550222264395819
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,6144,768,0.0052168890833854675
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,6144,2560,0.016561778055297006
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,6144,2048,0.015142222245534262
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,6144,1536,0.01444533301724328
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,6144,512,0.004230222354332606
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,6144,1024,0.013823111024167804
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,6144,256,0.003842666745185852
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,6144,128,0.0035075553589397003
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,6144,768,0.013554666605260638
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,6144,64,0.0028284444577164124
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,6144,512,0.01295555548535453
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,6144,32,0.0032462223122517266
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,6144,256,0.012416000167528788
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,6144,128,0.011765333513418833
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,6144,64,0.011723555624485016
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,6144,32,0.012088889049159156
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,5120,65536,0.11600177817874485
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,5120,51200,0.09268533521228367
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,5120,16384,0.035868446032206215
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,5120,12288,0.030250665214326646
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,5120,65536,0.1520586676067776
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,5120,10240,0.026886221435334947
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,6144,10240,0.033752888441085815
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,5120,16384,0.0467582212554084
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,5120,51200,0.11996622880299886
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,5120,8192,0.023289778166347083
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,5120,12288,0.03559733430544535
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,5120,6144,0.01439377831088172
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,5120,10240,0.03180177675353156
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,5120,8192,0.027684445182482403
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,5120,7168,0.024708444873491924
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,5120,4096,0.011354666617181567
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,5120,6144,0.023223999473783705
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,5120,3584,0.011249778171380361
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,5120,5120,0.021410667233996924
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,5120,3072,0.009995555712117089
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,5120,2560,0.008952889177534316
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,5120,4096,0.01955200069480472
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,5120,2048,0.008277333445019191
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,5120,3584,0.01868266695075565
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,5120,1536,0.006227555374304454
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,5120,3072,0.01719199948840671
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,5120,1024,0.0052533331844541765
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,5120,2048,0.014888889259762235
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,5120,768,0.004861333303981357
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,5120,1536,0.014286221729384528
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,5120,512,0.004231111043029361
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,5120,1024,0.013834666874673633
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,5120,256,0.003532444437344869
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,5120,768,0.013340444200568728
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,5120,128,0.0031902222997612427
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,5120,512,0.01295555548535453
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,5120,256,0.012081777883900536
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,5120,128,0.011736888852384357
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,5120,32,0.0031964443624019623
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,5120,64,0.012078222301271228
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,4096,65536,0.09228266610039605
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,5120,7168,0.016499555773205228
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,5120,32,0.011352889239788055
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,5120,5120,0.012778666284349231
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,4096,51200,0.0756675534778171
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,4096,16384,0.03080444534619649
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,4096,12288,0.026001777913835313
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,4096,51200,0.08858311176300049
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,4096,65536,0.11144267188178168
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,4096,16384,0.03487022386656867
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,4096,10240,0.023099554909600153
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,4096,8192,0.016131555040677387
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,4096,12288,0.02757955590883891
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,4096,7168,0.014515555567211576
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,4096,10240,0.024364444944593642
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,5120,2560,0.016159110599093966
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,4096,8192,0.02236355510022905
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,4096,5120,0.011418666276666852
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,4096,7168,0.020356444848908316
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,4096,4096,0.010712888505723743
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,4096,3584,0.009326222042242685
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,4096,5120,0.017549332645204332
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,4096,3072,0.008388444781303406
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,4096,4096,0.01647733317481147
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,4096,2560,0.007589333587222629
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,5120,64,0.003162666741344664
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,4096,3072,0.014755555325084262
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,4096,2560,0.014105778601434497
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,4096,1536,0.005544888890451855
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,4096,2048,0.013426666458447775
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,4096,1024,0.004583999928500918
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,4096,1536,0.013150222599506378
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,4096,768,0.004182222402758068
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,4096,1024,0.012835555606418185
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,4096,768,0.012784889174832238
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,4096,512,0.0038568890757030914
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,4096,6144,0.012981333666377597
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,4096,512,0.01240711079703437
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,4096,256,0.003519111209445529
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,4096,128,0.0032106666929192017
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,4096,64,0.0031742221779293488
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,4096,6144,0.019479110836982727
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,4096,256,0.011720889144473605
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,4096,32,0.0031884445084465873
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,4096,128,0.011376889215575324
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,4096,64,0.011376889215575324
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,4096,3584,0.015454222758611044
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,3584,65536,0.08867110808690389
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,4096,32,0.011389333340856763
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,3584,16384,0.029581334855821397
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,4096,2048,0.006627555522653792
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,3584,65536,0.10889689127604167
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,3584,12288,0.023551111419995625
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,3584,16384,0.0337413317627377
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,3584,51200,0.08695555395550197
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,3584,10240,0.021487111846605938
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,3584,8192,0.016175111134847004
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,3584,7168,0.013782222237851886
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,3584,6144,0.012198222180207571
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,3584,10240,0.023707555400000677
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,3584,8192,0.02160888910293579
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,3584,5120,0.010809777511490716
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,3584,7168,0.0199644449684355
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,3584,4096,0.00999022192425198
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,3584,6144,0.018820444742838543
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,3584,3584,0.009000889129108852
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,3584,3072,0.008269333177142674
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,3584,5120,0.017504000001483493
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,3584,2560,0.007254222200976477
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,3584,3584,0.015618667006492615
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,3584,3072,0.014311111635631986
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,3584,2048,0.006261333409282897
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,3584,1536,0.005286222116814719
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,3584,2560,0.013802666631009845
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,3584,1024,0.004273777620659934
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,3584,2048,0.013431111143694984
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,3584,1536,0.013280889226330651
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,3584,768,0.0038862224254343244
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,3584,512,0.0038204445607132385
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,3584,1024,0.01277955538696713
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,3584,256,0.003519999898142285
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,3584,768,0.0127697777416971
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,3584,512,0.012400888734393649
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,3584,128,0.0032008888406885993
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,3584,256,0.011687999798191918
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,3584,51200,0.07096178001827665
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,3584,64,0.0028408887899584244
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,3584,32,0.0030168888883458245
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,3584,128,0.011381333072980246
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,3072,65536,0.07735021909077962
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,3584,64,0.011696889168686338
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,3584,32,0.011738667057620155
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,3584,12288,0.026203556193245783
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,3072,51200,0.06298400296105279
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,3072,16384,0.02494311167134179
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,3072,12288,0.02091911103990343
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,3072,65536,0.10644088851081
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,3072,10240,0.017851556340853374
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,3072,16384,0.03267733256022135
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,3072,8192,0.01685688893000285
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,3072,12288,0.025729777084456548
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,3072,7168,0.014714666538768344
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,3072,6144,0.014075555735164218
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,3072,10240,0.02335111134582096
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,3584,4096,0.015857777661747403
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,3072,5120,0.01072266697883606
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,3072,7168,0.01995022263791826
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,3072,8192,0.021406221720907424
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,3072,4096,0.009763555394278632
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,3072,3584,0.008616888688670265
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,3072,6144,0.018527110417683918
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,3072,3072,0.007700444095664554
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,3072,5120,0.01721333298418257
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,3072,2560,0.007809778054555257
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,3072,4096,0.01551644504070282
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,3072,2048,0.006903999795516332
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,3072,3584,0.014831999937693277
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,3072,1536,0.00591111100382275
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,3072,3072,0.014088888963063559
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,3072,1024,0.004943999979231092
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,3072,2560,0.013772444592581855
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,3072,768,0.004564444637960858
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,3072,512,0.0038888889054457345
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,3072,2048,0.013441777891582914
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,3072,1536,0.013065777719020844
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,3072,256,0.003536888708670934
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,3072,1024,0.012442666623327466
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,3072,128,0.003162666741344664
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,3072,768,0.012724444270133972
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,3072,64,0.0028764444092909494
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,3072,512,0.012488889197508493
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,3072,32,0.0031848889258172777
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,3072,128,0.011375111010339526
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,3072,64,0.011380444798204633
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,2560,65536,0.06654577785068087
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,3072,32,0.011760888828171624
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,2560,51200,0.05427999960051643
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,2560,16384,0.02196177840232849
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,2560,65536,0.10400888654920791
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,2560,51200,0.0826444427172343
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,3072,51200,0.08473689026302761
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,2560,10240,0.01686844395266639
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,2560,16384,0.031720889939202204
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,2560,12288,0.025120000044504803
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,2560,8192,0.014730667074521383
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,2560,7168,0.013980444934633044
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,2560,10240,0.022896000080638464
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,2560,6144,0.012539555629094442
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,2560,7168,0.019651555352740817
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,2560,5120,0.011585777832402123
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,2560,4096,0.009353777600659264
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,2560,6144,0.018193778064515855
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,2560,3584,0.008056888977686564
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,2560,5120,0.01684177749686771
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,2560,4096,0.01515111161602868
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,2560,3072,0.00739911115831799
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,2560,2560,0.006568888823191325
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,2560,3584,0.014840000205569796
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,2560,2048,0.005599110904667113
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,2560,3072,0.0144177774588267
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,2560,1536,0.005249777601824866
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,2560,2560,0.013813333378897773
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,3072,256,0.011693333586057028
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,2560,1024,0.004512888689835866
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,2560,768,0.004021333323584663
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,2560,2048,0.01313333296113544
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,2560,512,0.0038311113086011675
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,2560,1536,0.01313066648112403
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,2560,256,0.0035413333939181436
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,2560,768,0.013032889200581444
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,2560,128,0.0031395554542541504
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,2560,512,0.0120666664507654
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,2560,64,0.002867555452717675
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,2560,12288,0.0188719994492001
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,2560,32,0.0028364445186323593
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,2560,128,0.011699555648697747
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,2560,64,0.011379555695586734
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,2048,65536,0.054562668005625405
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,2560,32,0.011023110813564725
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,2048,51200,0.04485244552294413
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,2560,8192,0.02075111038155026
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,2048,16384,0.018529777725537617
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,2048,65536,0.10013866424560547
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,2048,12288,0.015121777852376303
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,2048,10240,0.013396444420019785
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,2048,16384,0.030863109562132094
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,2048,8192,0.012410666379663678
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,2048,12288,0.024694222542974684
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,2048,7168,0.01204355557759603
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,2048,8192,0.020336000455750358
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,2048,6144,0.011359111302428775
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,2048,7168,0.01887911061445872
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,2048,5120,0.00997155573632982
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,2048,6144,0.017255110873116385
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,2560,1024,0.012392000191741519
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,2048,4096,0.008954666554927826
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,2048,3584,0.007937777373525832
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,2048,5120,0.01592266725169288
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,2048,3072,0.00723555518521203
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,2560,256,0.011782222323947482
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,2048,4096,0.01483022173245748
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,2048,2560,0.006223111102978389
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,2048,3584,0.01481599940194024
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,2048,2048,0.005554666535721884
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,2048,1536,0.004851555658711327
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,2048,3072,0.014112000664075216
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,2048,1024,0.00407644444041782
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,2048,768,0.003653333418899112
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,2048,2560,0.013934221532609729
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,2048,2048,0.013111111190583972
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,2048,512,0.003519999898142285
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,2048,1536,0.012783110969596438
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,2048,256,0.0031902222997612427
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,2048,128,0.002965333354141977
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,2048,768,0.012788444757461548
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,2048,64,0.0028213332924577924
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,2048,512,0.01205244412024816
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,2048,256,0.011701333026091257
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,2048,32,0.0028115556471877625
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,2048,51200,0.08022577895058526
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,2048,128,0.011736888852384357
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,1536,65536,0.04228444563017952
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,2048,64,0.011698666546079846
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,2048,32,0.011045333411958484
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,1536,16384,0.016065778003798593
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,2048,10240,0.02288977801799774
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,1536,12288,0.01447111037042406
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,1536,10240,0.013059555656380124
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,1536,65536,0.09720177782906426
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,1536,51200,0.07750666803783841
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,1536,8192,0.01239911135700014
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,1536,7168,0.011232888533009423
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,1536,12288,0.024344889654053584
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,1536,10240,0.022218666142887537
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,1536,6144,0.011055111057228513
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,1536,8192,0.019552888141738046
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,1536,5120,0.01035377797153261
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,1536,7168,0.018610666195551556
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,1536,4096,0.008277333445019191
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,1536,6144,0.01683288812637329
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,1536,3584,0.007272889216740926
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,1536,5120,0.015542222393883599
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,1536,3072,0.006575111299753189
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,1536,4096,0.01478844384352366
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,1536,2560,0.005903111149867375
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,1536,3584,0.014779556128713818
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,1536,2048,0.0052764444715446895
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,1536,3072,0.013815999858909182
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,1536,1536,0.004862222406599256
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,2048,1024,0.01240711079703437
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,1536,1024,0.004202666795916027
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,1536,2048,0.01314222233162986
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,1536,768,0.003891555385457145
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,1536,1536,0.0127688886390792
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,1536,512,0.003540444291300244
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,1536,1024,0.012400888734393649
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,1536,256,0.003504000190231535
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,1536,51200,0.03436177637841966
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,1536,768,0.012786666552225748
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,1536,128,0.0028479999552170434
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,1536,64,0.0028568889117903183
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,1536,256,0.011692444483439127
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,1536,128,0.011700444751315646
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,1536,32,0.0031724443866146933
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,1536,16384,0.03040177623430888
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,1536,64,0.011738667057620155
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,1024,65536,0.031110223796632554
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,1024,51200,0.025424000289705064
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,1536,32,0.011720889144473605
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,1024,16384,0.012861332959598966
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,1024,12288,0.013791999883121915
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,1024,51200,0.07441511419084337
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,1024,16384,0.02991022335158454
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,1024,10240,0.012487110992272695
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,1024,8192,0.01146577795346578
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,1024,12288,0.02367466688156128
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,1024,7168,0.010198222266303169
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,1024,10240,0.020969778299331665
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,1024,6144,0.010822222464614444
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,1024,7168,0.01793866687350803
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,1024,5120,0.009338666995366415
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,1024,6144,0.016604445046848722
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,1024,4096,0.00795288880666097
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,1024,5120,0.015839111473825242
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,1024,3584,0.007296000089910295
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,1024,4096,0.015012444721327888
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,1024,3072,0.006577777779764599
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,1536,512,0.012095111111799875
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,1024,2560,0.005894222193294101
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,1024,3584,0.014547554983033074
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,1024,2048,0.006319111006127463
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,1024,3072,0.014104889498816596
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,1024,1536,0.005212444398138259
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,1024,2560,0.01369511087735494
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,1024,1024,0.004534222185611725
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,1024,1536,0.01309866706530253
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,1024,768,0.003858666867017746
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,1024,1024,0.012375999655988483
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,1024,512,0.0037253333462609183
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,1024,256,0.0031822222388452957
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,1024,768,0.012729778057999082
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,1024,128,0.0031715554909573663
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,1024,8192,0.018869333797030978
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,1024,256,0.011698666546079846
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,1024,64,0.002862222285734283
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,1536,2560,0.013739555246300168
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,1024,128,0.011707555916574268
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,768,65536,0.02477333280775282
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,1024,64,0.011067555182509951
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,768,51200,0.02197155521975623
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,1024,32,0.01073333372672399
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,768,16384,0.014350222216712104
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,768,65536,0.09194755554199219
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,768,51200,0.07209599680370755
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,768,12288,0.011848889291286469
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,768,16384,0.02942488922013177
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,768,10240,0.011063111325105032
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,768,8192,0.010100444157918295
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,768,12288,0.022617777188618977
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,768,10240,0.020595555504163105
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,768,7168,0.009329777624871995
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,1024,2048,0.013456888496875763
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,1024,65536,0.09389244185553657
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,768,7168,0.01757688820362091
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,768,5120,0.007630222373538547
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,768,6144,0.01683911184469859
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,768,4096,0.00776622196038564
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,768,3584,0.007328000333574083
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,768,5120,0.015466666883892484
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,768,3072,0.006229333165619109
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,768,4096,0.014863111906581454
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,768,2560,0.0059368887709246735
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,768,3584,0.014486221803559197
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,768,2048,0.005249777601824866
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,1024,32,0.0028284444577164124
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,768,3072,0.013762666947311826
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,768,1536,0.004554666578769684
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,768,2560,0.013768889009952545
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,768,1024,0.003875555677546395
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,768,2048,0.013087111214796701
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,768,768,0.003567111161020067
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,768,1024,0.012430222498046027
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,768,512,0.00318755561278926
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,768,768,0.012443555725945367
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,768,256,0.0031840000301599503
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,768,512,0.01240355521440506
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,768,128,0.0028808888875775864
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,768,256,0.011537777880827585
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,768,8192,0.018886221779717337
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,768,128,0.011742221812407175
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,768,32,0.002564444517095884
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,768,64,0.011709333293967776
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,512,65536,0.020607999629444547
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,768,32,0.011040888726711273
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,512,51200,0.016506666938463848
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,1024,512,0.012070222033394707
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,512,16384,0.011002666420406766
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,512,65536,0.0897902250289917
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,512,12288,0.00924355536699295
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,512,51200,0.07008177704281278
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,512,16384,0.027854220734702215
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,512,10240,0.00979288915793101
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,512,8192,0.008651555412345463
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,512,12288,0.022796443767017786
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,512,7168,0.009372444616423713
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,512,10240,0.020377778344684176
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,512,6144,0.009702222214804756
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,512,8192,0.018930666976504855
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,512,5120,0.008647999829716152
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,512,7168,0.017859554953045316
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,512,4096,0.00759733302725686
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,512,6144,0.016203555795881484
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,512,5120,0.015834665960735746
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,768,6144,0.008667555948098501
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,512,4096,0.014827556080288358
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,512,3072,0.006583111153708563
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,512,3584,0.014502222339312235
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,512,2560,0.0058959999846087555
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,512,2048,0.0052720002002186244
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,512,3072,0.014144000079896716
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,512,1536,0.004575110971927643
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,512,2560,0.013788444300492605
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,512,1024,0.004224888980388641
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,512,2048,0.012828444441159567
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,512,768,0.003551111039188173
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,512,1536,0.012776888906955719
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,512,512,0.003168888803985384
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,512,1024,0.012423999607563019
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,512,256,0.0031911111954185697
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,512,768,0.012088889049159156
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,512,128,0.002883555574549569
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,512,512,0.012101333174440594
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,512,64,0.002817777709828483
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,768,1536,0.012787555654843649
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,512,64,0.011408888631396823
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,256,65536,0.016827555166350473
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,512,3584,0.00692622239391009
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,256,65536,0.08683288759655422
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,256,51200,0.01889866590499878
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,768,64,0.0028159999185138275
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,256,16384,0.009941333697901832
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,256,12288,0.009931555224789513
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,256,51200,0.06821955574883355
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,256,16384,0.027454222242037456
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,256,10240,0.009001777403884465
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,256,12288,0.02234933276971181
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,256,8192,0.008614222208658854
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,256,7168,0.009078222016493479
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,256,10240,0.02058844433890449
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,256,6144,0.008642666869693333
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,256,8192,0.018255111243989732
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,256,7168,0.017514665921529133
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,256,6144,0.016249777542220224
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,256,4096,0.007256000406212277
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,256,5120,0.015472888946533203
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,512,256,0.011759999725553723
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,256,3584,0.0069057775868309875
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,512,128,0.011128000087208219
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,256,3072,0.006217777729034424
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,256,2560,0.005623111294375525
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,256,4096,0.014442667365074158
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,256,2048,0.005200888961553574
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,512,32,0.010703110860453712
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,256,3072,0.013442666994200813
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,256,1536,0.00453599997692638
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,256,2560,0.013750221994188098
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,256,1024,0.003850666599141227
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,256,768,0.0035084444615576
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,256,2048,0.012792000340090858
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,256,1536,0.01276266657643848
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,256,1024,0.01238844460911221
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,256,768,0.01204622205760744
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,256,512,0.011732444167137146
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,256,128,0.0028026666906144884
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,256,256,0.011423110961914062
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,256,128,0.01108000013563368
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,256,64,0.0025475554996066624
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,256,5120,0.008622222476535374
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,256,32,0.0028311111446883944
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,256,64,0.01073155552148819
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,128,65536,0.014920888675583733
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,256,32,0.010738666686746808
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,512,32,0.002532444480392668
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,128,51200,0.013414222333166333
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,128,16384,0.009319999979601966
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,256,3584,0.014540443817774454
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,128,12288,0.010029333333174387
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,128,51200,0.06650844547483656
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,128,16384,0.026946667167875502
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,128,10240,0.008984000318580205
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,128,8192,0.008279999925030602
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,256,512,0.0031991110493739447
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,128,12288,0.023031999667485554
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,128,7168,0.008988444175985124
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,128,10240,0.020226667324701946
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,128,6144,0.008286221987671321
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,256,256,0.003144888828198115
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,128,5120,0.007706666986147563
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,128,8192,0.018602665927675035
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,128,4096,0.0069324444565508105
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,128,7168,0.017875555488798354
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,128,3584,0.0069324444565508105
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,128,6144,0.016162667009565566
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,128,5120,0.015563555889659457
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,128,4096,0.014832889040311178
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,128,2560,0.005867555737495422
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,128,3584,0.014522666732470194
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,128,3072,0.013528889252079858
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,128,1536,0.00452622233165635
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,128,2560,0.013812444276279874
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,128,2048,0.013452444639470843
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,128,1536,0.01240711079703437
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,128,768,0.0034906665484110513
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,128,1024,0.012482666307025485
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,128,512,0.0031991110493739447
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,128,256,0.0028942223224374983
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,128,768,0.012120889292822944
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,128,512,0.011769777370823754
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,128,128,0.002603555512097147
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,128,64,0.0025537777692079544
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,128,256,0.011905777785513135
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,128,32,0.0028488888508743713
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,128,128,0.010998222563001843
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,128,64,0.01073688848151101
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,64,65536,0.014547554983033074
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,128,32,0.011066666907734342
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,64,51200,0.013748444616794586
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,64,16384,0.009016888837019602
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,64,65536,0.08348533180024888
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,64,12288,0.009311111436949836
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,128,3072,0.006237333433495627
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,64,16384,0.027064000566800434
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,64,10240,0.00867377801073922
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,64,8192,0.007761778102980719
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,128,2048,0.004906666775544484
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,64,12288,0.022291556000709534
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,64,7168,0.007634667058785756
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,64,10240,0.02030044462945726
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,64,6144,0.007304000357786815
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,64,8192,0.0184871107339859
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,64,5120,0.007190222541491191
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,128,1024,0.0038319999972979226
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,64,4096,0.007263999846246507
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,64,7168,0.017234666479958426
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,64,3584,0.006950221955776215
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,64,6144,0.016186666157510545
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,64,3072,0.006568888823191325
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,64,5120,0.015171556009186639
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,64,4096,0.01478488908873664
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,64,2048,0.005946666830115848
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,64,3072,0.013467555244763693
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,64,1536,0.0042364444169733255
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,64,2560,0.013204444613721637
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,128,65536,0.08386311266157363
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,64,2048,0.013067555924256643
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,64,1024,0.003559111307064692
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,64,768,0.003551111039188173
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,64,512,0.003297777846455574
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,64,1536,0.012439111040698158
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,64,256,0.0028640000770489373
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,64,1024,0.012053333222866058
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,64,768,0.012293332980738746
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,64,128,0.0024862223201327855
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,64,512,0.012065778175989786
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,64,256,0.011352000137170156
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,64,128,0.01073688848151101
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,64,32,0.00253866674999396
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,64,64,0.011418666276666852
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,32,65536,0.022336888644430373
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,64,51200,0.06564888689253065
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,32,51200,0.01960444450378418
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,64,32,0.01068800025516086
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,32,16384,0.009023110899660323
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,32,12288,0.009371555513805812
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,32,65536,0.08309777577718098
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,32,51200,0.06505066818661161
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,32,10240,0.008974221845467886
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,32,16384,0.027106665902667578
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,32,8192,0.008283555507659912
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,32,12288,0.022322666313913133
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,32,10240,0.0206657780541314
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,32,8192,0.018424888451894123
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,32,6144,0.007309333317809635
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,64,2560,0.00629066675901413
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,32,5120,0.006953777538405524
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,32,7168,0.017512889371977914
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,32,4096,0.007520000139872233
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,32,3584,0.006949333681000604
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,32,6144,0.016158221496476066
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,32,5120,0.015477332803938123
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,32,3072,0.006248000181383557
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,32,4096,0.014468444718254937
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,32,3584,0.014534221755133735
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,32,2048,0.006252444452709622
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,32,3072,0.013760888742076026
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,32,1536,0.004514666481150521
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,32,2560,0.013397333522637686
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,32,1024,0.003842666745185852
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,64,64,0.0024764444679021835
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,32,2048,0.013166222307417126
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,32,768,0.003552000141806073
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,32,512,0.0032106666929192017
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,32,1536,0.012853333519564735
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,32,256,0.002934222213096089
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,32,1024,0.011751111182901593
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,32,128,0.0027991111079851785
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,32,768,0.012606222596433429
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,32,64,0.00250133333934678
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,32,512,0.011767110890812345
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,32,32,0.0028311111446883944
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,32,128,0.01096088853147295
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,32,64,0.011732444167137146
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,32,32,0.01036888857682546
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,32,7168,0.007954667011896769
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,64,3584,0.013948443863126965
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,97,32,2560,0.005960000058015187
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,65536,16384,0.3729955620235867
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,65536,16384,0.2175884379280938
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,65536,51200,0.6409529050191244
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,65536,12288,0.27707110510932076
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,65536,12288,0.16195733017391628
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,65536,51200,1.1437608930799696
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,97,32,256,0.011714666253990598
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,65536,10240,0.20851377646128336
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,65536,10240,0.1375511089960734
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,65536,8192,0.17412177721659342
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,65536,7168,0.15102577209472656
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,65536,8192,0.11735288302103679
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,65536,7168,0.1002604431576199
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,65536,6144,0.1295093297958374
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,65536,12288,0.22878665394253203
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,65536,6144,0.08831022183100383
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,65536,8192,0.15733244684007433
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,65536,7168,0.1419902245203654
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,65536,5120,0.10955555571450128
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,65536,16384,0.30039821730719674
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,65536,10240,0.19155200322469076
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,65536,4096,0.09460355838139851
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,65536,5120,0.07524177763197157
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,65536,3584,0.07958577738867866
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,65536,4096,0.0632257792684767
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,65536,3072,0.06957599851820204
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,65536,3584,0.05748089154561361
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,65536,3072,0.051182223690880664
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,65536,2560,0.058113780286577016
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,65536,6144,0.12565333313412136
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,65536,5120,0.11144977145724827
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,65536,4096,0.09488977988560994
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,65536,2048,0.04775199956364102
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,65536,1536,0.037321776151657104
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,65536,2560,0.04567022124926249
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,65536,2048,0.04075288772583008
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,65536,3072,0.07932177517149183
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,65536,3584,0.08714133501052856
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,65536,2560,0.07098844316270617
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,65536,1024,0.029626667499542236
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,65536,2048,0.06390844451056586
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,65536,768,0.021309332715140447
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,65536,1536,0.03390577766630385
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,65536,512,0.014543111125628153
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,65536,1024,0.02907022171550327
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,65536,1024,0.04857244425349765
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,65536,256,0.009010666774378883
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,65536,768,0.024490666058328416
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,65536,768,0.04425155454211765
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,65536,128,0.008027555214034187
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,65536,512,0.03887110948562622
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,65536,256,0.03421422176890903
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,65536,64,0.007040888898902469
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,65536,128,0.027423999375767175
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,65536,32,0.007096000015735626
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,65536,512,0.021514667405022517
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,65536,64,0.017549332645204332
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,65536,32,0.02093066606256697
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,51200,65536,0.6718088785807291
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,65536,1536,0.05624710851245456
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,51200,65536,1.0972355736626518
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,65536,256,0.01920977731545766
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,65536,128,0.017512000269360013
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,51200,16384,0.27903734313117134
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,51200,16384,0.17535911666022408
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,51200,51200,0.5126079983181423
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,51200,51200,0.8580204645792643
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,51200,12288,0.21052000257703993
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,51200,12288,0.13123288419511583
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,51200,10240,0.17277244726816812
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,51200,10240,0.11158755090501572
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,65536,51200,0.9595911237928602
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,51200,8192,0.14067467053731283
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,51200,8192,0.1006044414308336
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,51200,7168,0.12063822481367324
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,51200,10240,0.16550578011406794
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,51200,8192,0.13734222782982722
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,51200,7168,0.08318399720721774
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,51200,16384,0.2508142259385851
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,51200,6144,0.10590844684176975
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,51200,6144,0.07300800085067749
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,51200,5120,0.09002844492594402
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,51200,5120,0.06283377938800387
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,51200,4096,0.07298133108350965
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,51200,6144,0.10987022187974717
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,51200,3584,0.06334044535954793
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,51200,4096,0.05292088786760966
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,51200,5120,0.09729155566957261
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,51200,3584,0.04863111178080241
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,51200,3072,0.0558462209171719
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,51200,4096,0.08405511246787177
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,51200,12288,0.19297067324320474
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,51200,3584,0.07782933447096083
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,51200,3072,0.07113333543141682
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,51200,2560,0.039317333035998873
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,51200,2048,0.03859644465976291
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,51200,2560,0.0645973351266649
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,51200,1536,0.03005511230892605
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,51200,1536,0.029509332444932725
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,51200,7168,0.1240053309334649
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,51200,2048,0.05853155586454603
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,51200,1024,0.022720000810093347
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,51200,1536,0.049977779388427734
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,51200,768,0.016798221402698092
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,51200,1024,0.0259253333012263
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,51200,1024,0.044290665123197764
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,51200,512,0.01202488856183158
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,51200,3072,0.04356177647908529
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,51200,768,0.021949332621362474
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,51200,2560,0.04669510987069872
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,51200,768,0.04117244482040405
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,51200,256,0.008835555778609382
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,51200,512,0.03586577706866794
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,51200,128,0.005631111148330901
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,51200,256,0.01737422247727712
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,51200,256,0.03252977795071072
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,51200,64,0.004584889031118817
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,51200,32,0.004969777746333016
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,51200,128,0.015809777710172866
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,51200,128,0.025403555896547105
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,51200,2048,0.03529422150717841
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,51200,64,0.016857778032620747
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,51200,32,0.018954666124449838
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,51200,51200,0.7625857988993326
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,16384,65536,0.34158934487236875
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,16384,51200,0.2684497833251953
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,51200,65536,0.9894231160481771
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,16384,16384,0.08887733353508843
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,16384,51200,0.208752883805169
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,16384,12288,0.06944355699751112
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,16384,12288,0.057690666781531445
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,16384,10240,0.05747822258207533
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,51200,512,0.019903111788961623
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,16384,10240,0.05016711023118761
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,16384,8192,0.049010667535993785
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,16384,12288,0.06799377997716267
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,16384,16384,0.08807110786437988
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,16384,10240,0.061168001757727734
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,16384,7168,0.04268444577852885
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,16384,8192,0.04413422279887729
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,16384,6144,0.03684355484114753
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,16384,7168,0.03925333420435587
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,16384,65536,0.27061155107286244
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,16384,8192,0.05476266807980008
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,16384,5120,0.031856000423431396
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,16384,6144,0.03504088852140639
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,16384,16384,0.07694844404856364
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,16384,5120,0.03147733211517334
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,16384,4096,0.027115555273161993
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,16384,6144,0.046351999044418335
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,16384,3584,0.0236799998415841
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,16384,51200,0.2091439962387085
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,16384,4096,0.027552000350422327
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,16384,65536,0.2659555541144477
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,16384,4096,0.03899377915594313
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,16384,3584,0.02534577747186025
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,16384,3584,0.037478221787346735
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,16384,3072,0.023078221413824294
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,16384,7168,0.05049333307478163
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,16384,2048,0.014676445060306124
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,16384,2048,0.01955111159218682
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,16384,5120,0.04271911250220405
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,16384,1536,0.012039999994966718
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,16384,2048,0.03212622139188979
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,16384,2560,0.017432888348897297
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,16384,1536,0.017842666970358956
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,16384,1024,0.00964355551534229
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,16384,1536,0.029880000485314265
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,16384,768,0.00797333319981893
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,16384,2560,0.02130222154988183
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,16384,2560,0.03347200155258179
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,16384,1024,0.016528000434239704
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,16384,1024,0.02808977829085456
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,16384,512,0.006529777828190062
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,16384,256,0.00452622233165635
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,16384,768,0.01577333278126187
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,16384,512,0.02360533343421088
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,16384,128,0.0038444445365005066
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,16384,512,0.013796444568369122
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,16384,256,0.013079110946920184
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,16384,256,0.02199288871553209
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,16384,64,0.0034977777136696708
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,16384,32,0.0038284444146686127
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,16384,128,0.012152888708644442
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,16384,64,0.01277511070171992
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,16384,32,0.013810666898886362
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,12288,65536,0.2701333363850911
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,12288,65536,0.21819467014736602
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,16384,3072,0.020938666330443487
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,12288,51200,0.21238666110568574
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,12288,16384,0.0712782210773892
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,12288,51200,0.16834399435255262
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,16384,3072,0.0351857774787479
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,12288,12288,0.05557511250178019
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,16384,768,0.025137777129809063
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,12288,16384,0.06367378102408515
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,12288,10240,0.04584533307287428
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,16384,128,0.01921777758333418
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,12288,12288,0.06237688991758558
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,12288,12288,0.04829244481192695
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,12288,10240,0.04243822230233086
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,12288,8192,0.03926400012440152
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,12288,7168,0.03393955694304572
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,12288,10240,0.05631111065546671
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,12288,8192,0.037716444995668195
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,12288,6144,0.029680000411139593
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,12288,8192,0.05010044574737549
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,12288,65536,0.23151644070943198
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,12288,7168,0.0335440006521013
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,12288,51200,0.186518218782213
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,12288,7168,0.04696089029312134
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,12288,6144,0.030597332451078627
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,12288,4096,0.02257866660753886
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,12288,6144,0.04331466555595398
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,12288,3584,0.01919644408755832
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,12288,5120,0.040256887674331665
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,12288,4096,0.02362577782736884
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,12288,4096,0.0369031098153856
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,12288,3584,0.021827555365032617
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,12288,3584,0.03589422172970242
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,12288,2560,0.014208000567224292
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,12288,3072,0.020651555723614164
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,12288,3072,0.03301422132386102
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,12288,2048,0.012422222230169507
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,12288,2560,0.03257333238919576
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,12288,16384,0.07716088824801974
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,12288,2560,0.01959111127588484
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,12288,1536,0.010299555957317352
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,12288,2048,0.018233777748213876
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,12288,2048,0.030464887619018555
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,12288,1024,0.008606221940782335
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,12288,1536,0.016591999265882704
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,12288,1536,0.02905155552758111
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,12288,768,0.0074888889988263445
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,12288,1024,0.025348444779713947
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,12288,1024,0.014934221903483072
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,12288,512,0.00526311124364535
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,12288,768,0.025222222010294598
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,12288,768,0.014138667119873894
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,12288,256,0.00424177779091729
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,12288,512,0.023318222827381555
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,12288,512,0.013352889153692456
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,12288,5120,0.025810667210155066
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,12288,128,0.003859555555714501
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,12288,256,0.0233324451578988
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,12288,64,0.003212444484233856
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,12288,5120,0.02665422194533878
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,12288,32,0.0035075553589397003
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,12288,128,0.012430222498046027
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,12288,128,0.01920711166328854
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,12288,3072,0.017065778374671936
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,12288,32,0.012832000023788877
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,12288,64,0.013774221969975365
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,10240,65536,0.20588533083597818
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,10240,51200,0.15976888603634304
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,10240,16384,0.05422844489415487
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,10240,65536,0.20767288737826875
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,10240,51200,0.1630044380823771
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,10240,12288,0.0432568887869517
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,10240,16384,0.06145066685146756
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,10240,12288,0.04622933268547058
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,10240,10240,0.03613244493802389
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,10240,16384,0.07511288589901395
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,10240,12288,0.0609875586297777
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,10240,10240,0.0407591097884708
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,10240,8192,0.03108533223470052
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,12288,256,0.01275022245115704
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,10240,10240,0.055381334490246244
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,10240,7168,0.02650844388537937
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,10240,8192,0.03593066665861342
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,10240,51200,0.1795182228088379
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,10240,6144,0.02329066726896498
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,10240,8192,0.048935999472936
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,10240,7168,0.03251733382542928
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,10240,5120,0.020233778489960563
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,10240,65536,0.22315822707282174
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,10240,4096,0.017982222967677645
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,10240,6144,0.029473778274324205
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,10240,3584,0.014927999840842353
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,10240,7168,0.04520710971620348
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,10240,5120,0.02590399980545044
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,10240,5120,0.038887110021379255
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,10240,4096,0.03678844372431437
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,10240,4096,0.022682666778564453
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,10240,3584,0.021613332960340712
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,10240,3072,0.020224000016848247
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,10240,3072,0.03398933344417148
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,10240,2048,0.01055022246307797
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,10240,2560,0.019161777363883126
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,10240,2560,0.031769778993394636
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,10240,1536,0.009172444542249044
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,10240,2048,0.018187556001875136
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,10240,2048,0.03149244520399306
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,10240,1024,0.007253333098358578
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,10240,1536,0.015802666544914246
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,10240,1536,0.029121776421864826
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,10240,768,0.00591555568906996
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,10240,1024,0.014785778191354541
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,10240,1024,0.025018667181332905
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,10240,512,0.004518222063779831
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,10240,768,0.014135999812020196
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,10240,768,0.025382222400771245
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,10240,256,0.003899555653333664
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,10240,512,0.013072888884279462
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,10240,512,0.02437066700723436
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,10240,128,0.0037697777152061462
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,10240,256,0.012496000362767113
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,10240,256,0.02179644505182902
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,10240,6144,0.042018665207756885
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,10240,64,0.003167111012670729
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,10240,128,0.012415111064910889
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,10240,32,0.0032400000426504347
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,10240,128,0.020597333709398907
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,10240,3072,0.013728888498412238
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,10240,3584,0.03492355677816603
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,10240,64,0.012164444559150271
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,10240,32,0.013099555340078143
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,8192,65536,0.1748035616344876
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,8192,51200,0.14008977678087023
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,8192,16384,0.04798577891455757
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,8192,65536,0.16640178362528482
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,8192,51200,0.13032266828748915
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,8192,12288,0.03730310996373495
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,8192,16384,0.050266666544808276
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,8192,10240,0.031472888257768415
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,8192,16384,0.06947644551595052
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,8192,12288,0.0574151078859965
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,8192,10240,0.034338666333092585
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,8192,8192,0.026351999905374315
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,8192,10240,0.05269866519504123
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,8192,8192,0.02995733420054118
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,8192,51200,0.16545422871907553
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,8192,7168,0.023289778166347083
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,8192,6144,0.020273778173658583
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,8192,65536,0.20578932762145996
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,8192,7168,0.02637422250376807
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,8192,5120,0.017628444565667045
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,8192,7168,0.04426844583617317
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,8192,6144,0.024152888192070857
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,8192,6144,0.041519999504089355
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,10240,2560,0.012160888976520963
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,8192,4096,0.01483022173245748
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,8192,3584,0.013439111411571503
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,8192,5120,0.02197066611713833
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,8192,5120,0.038725333081351385
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,8192,3072,0.011722666521867117
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,8192,3584,0.019161777363883126
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,8192,3584,0.03443288803100586
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,8192,2560,0.01054488867521286
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,8192,3072,0.01889244384235806
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,8192,3072,0.03186755710177951
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,8192,2048,0.009013333254390294
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,8192,12288,0.038444442881478205
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,8192,2560,0.017481777403089736
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,8192,2560,0.03252622154023912
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,8192,1536,0.007983999947706858
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,8192,2048,0.029792000850041706
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,8192,2048,0.016568000117937725
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,8192,1536,0.015208888385030957
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,8192,1024,0.006244444598754247
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,8192,1024,0.024847999215126038
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,8192,1024,0.014113777213626437
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,8192,768,0.004933333231343163
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,8192,768,0.024093333217832778
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,8192,768,0.013453333742088742
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,8192,512,0.004204444587230682
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,8192,512,0.013111111190583972
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,8192,256,0.0035377778112888336
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,8192,4096,0.02035288843843672
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,8192,4096,0.035767998960283064
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,8192,128,0.0034844444857703317
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,8192,256,0.012465777496496836
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,8192,256,0.02240088913175795
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,8192,64,0.0031724443866146933
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,8192,128,0.011763555308183035
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,8192,128,0.01959733333852556
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,8192,32,0.0031724443866146933
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,8192,64,0.012785777449607849
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,8192,32,0.012464889221721225
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,7168,65536,0.16382488939497206
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,8192,1536,0.02653955585426754
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,7168,65536,0.15714489089118108
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,8192,8192,0.04671555426385668
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,7168,51200,0.12646222114562988
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,7168,16384,0.04432355695300632
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,7168,16384,0.04931555522812737
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,7168,12288,0.03477511141035292
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,8192,512,0.02295822236273024
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,7168,16384,0.06928177674611409
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,7168,10240,0.028980443874994915
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,7168,12288,0.037500444385740496
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,7168,12288,0.057130667898390025
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,7168,65536,0.20331199963887533
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,7168,10240,0.03303822212749057
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,7168,51200,0.16428977913326687
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,7168,10240,0.05215644505288866
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,7168,8192,0.02921244502067566
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,7168,7168,0.021764443980322942
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,7168,6144,0.018980445133315194
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,7168,8192,0.04638311266899109
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,7168,7168,0.04366311099794176
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,7168,5120,0.016538666354285348
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,7168,6144,0.023800889650980633
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,7168,6144,0.04061333338419596
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,7168,4096,0.01406222250726488
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,7168,51200,0.13083822197384304
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,7168,5120,0.02169422143035465
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,7168,3584,0.012471111284361945
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,7168,4096,0.01982933282852173
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,7168,4096,0.03542222248183356
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,7168,3072,0.011399110986126794
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,7168,3584,0.019222221440739103
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,7168,2560,0.010029333333174387
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,7168,3072,0.018186666899257235
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,7168,3072,0.03235733177926805
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,7168,2048,0.008611555728647444
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,7168,2560,0.017058667209413316
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,7168,2560,0.03129955463939243
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,7168,1536,0.00740533322095871
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,7168,2048,0.016193777322769165
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,7168,2048,0.029800001117918227
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,7168,1024,0.005551110953092575
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,7168,8192,0.024821332759327356
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,7168,1536,0.01475644442770216
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,7168,768,0.004916444420814514
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,7168,1024,0.013782222237851886
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,7168,1024,0.02437866727511088
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,7168,512,0.0041751112374994485
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,7168,768,0.013405332962671915
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,7168,768,0.02407199972205692
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,7168,7168,0.026721777187453374
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,7168,256,0.0035662220584021676
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,7168,512,0.012703999876976013
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,7168,512,0.023345778385798138
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,7168,128,0.0031662223239739737
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,7168,256,0.02154133386082119
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,7168,256,0.012131555212868584
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,7168,5120,0.038254221280415855
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,7168,64,0.0028782222006056043
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,7168,128,0.018869333797030978
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,7168,32,0.0031742221779293488
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,7168,64,0.012811555630630918
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,7168,32,0.011798222031858234
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,6144,65536,0.13168533643086752
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,7168,3584,0.034466667307747736
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,6144,65536,0.15716532866160074
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,6144,51200,0.10424177514182197
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,6144,16384,0.0413955549399058
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,6144,51200,0.12067822615305583
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,6144,12288,0.03391733434465196
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,6144,16384,0.04765333400832283
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,7168,1536,0.025695110360781353
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,6144,12288,0.03604711095492045
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,6144,10240,0.029438220792346533
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,6144,12288,0.056741330358717174
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,6144,8192,0.02204977803760105
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,6144,51200,0.16240266958872476
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,6144,10240,0.031664000617133245
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,6144,10240,0.051799999343024365
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,6144,7168,0.019696000549528334
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,6144,65536,0.20148889223734537
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,6144,8192,0.028194665908813477
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,6144,6144,0.016971555021074083
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,6144,8192,0.04510133465131124
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,6144,7168,0.04310933417744107
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,6144,7168,0.025430222352345783
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,7168,128,0.012044444680213928
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,6144,5120,0.015338665909237333
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,6144,6144,0.03979111048910353
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,6144,4096,0.013459555804729462
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,6144,5120,0.037866665257347956
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,6144,5120,0.02130399975511763
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,6144,3584,0.011690666278203329
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,6144,4096,0.035271111461851336
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,6144,4096,0.01953866746690538
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,6144,3072,0.010621333287821876
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,6144,3584,0.018532445033391316
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,6144,3584,0.03432710965474447
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,6144,2560,0.010002666877375709
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,6144,3072,0.03200799889034695
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,6144,3072,0.017920000685585868
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,6144,2048,0.00832444429397583
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,6144,2560,0.03127022253142463
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,6144,2560,0.016917333006858826
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,6144,1536,0.007699555820888943
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,6144,2048,0.015127999915017022
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,6144,2048,0.029055999384986028
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,6144,1024,0.005604444278611078
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,6144,768,0.004965333475006951
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,6144,1536,0.025359110699759588
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,6144,1024,0.02504355543189579
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,6144,1024,0.013425778183672162
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,6144,512,0.0038951109680864546
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,6144,768,0.02365333338578542
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,6144,256,0.003530666646030214
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,6144,512,0.012446222205956778
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,6144,512,0.02365155518054962
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,6144,128,0.0032311110860771606
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,6144,256,0.012057777908113269
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,6144,256,0.02162577708562215
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,6144,64,0.0028808888875775864
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,6144,6144,0.02360533343421088
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,6144,128,0.018254222141371835
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,6144,64,0.011711999773979187
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,6144,32,0.011734222372372946
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,5120,65536,0.11333510610792373
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,5120,65536,0.15173066986931696
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,6144,16384,0.06882044341829088
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,6144,1536,0.014140443669425117
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,5120,51200,0.09296711285909016
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,5120,16384,0.03604177633921305
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,6144,768,0.012795555922720166
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,5120,51200,0.11966044372982448
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,5120,16384,0.046522667010625206
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,5120,65536,0.19885778427124023
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,5120,16384,0.06863555643293592
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,5120,10240,0.02683999968899621
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,5120,12288,0.03531644410557217
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,6144,32,0.0031582222630580268
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,5120,51200,0.16065066390567356
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,5120,8192,0.019136889113320243
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,5120,12288,0.05618221892250908
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,5120,10240,0.03053955568207635
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,5120,7168,0.016693333784739178
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,5120,10240,0.05083822210629781
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,5120,8192,0.04532355401251051
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,5120,6144,0.014528888795110913
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,5120,7168,0.025030222203996446
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,5120,7168,0.04214222232500712
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,5120,5120,0.013038222160604266
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,5120,6144,0.039523555172814265
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,5120,6144,0.023299554983774822
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,5120,4096,0.011319110790888468
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,5120,5120,0.02120622164673275
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,5120,5120,0.03730488816897074
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,5120,3584,0.011338666909270816
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,5120,4096,0.0196115556690428
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,5120,4096,0.03463911016782125
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,5120,3072,0.01054488867521286
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,5120,3584,0.033725334538353816
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,5120,3584,0.01870044403605991
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,5120,2560,0.009595555563767752
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,5120,3072,0.017551110850440133
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,5120,3072,0.03138400117556254
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,5120,2048,0.008609777523411645
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,5120,2560,0.03046755658255683
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,5120,12288,0.03090933296415541
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,5120,1536,0.006966222491529252
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,5120,2048,0.01459111107720269
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,5120,1024,0.0052639999323421055
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,5120,1536,0.02502577834659153
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,5120,1536,0.014124444789356656
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,5120,768,0.00464088883664873
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,5120,1024,0.013404444687896304
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,5120,1024,0.02400622268517812
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,5120,512,0.004232888834344016
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,5120,768,0.02425688836309645
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,5120,768,0.01314311143424776
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,5120,8192,0.02719555629624261
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,5120,512,0.012402666939629449
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,5120,256,0.0034871109657817413
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,5120,512,0.022983110613293115
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,5120,128,0.003152888889114062
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,5120,256,0.022721777359644573
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,5120,256,0.011702222128709158
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,5120,64,0.0028613333900769553
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,5120,128,0.011163555913501315
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,5120,128,0.01960000064637926
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,5120,32,0.002883555574549569
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,5120,64,0.011720000041855706
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,5120,32,0.012095111111799875
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,4096,65536,0.09120355712042914
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,4096,51200,0.07554755608240764
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,4096,65536,0.11176355679829915
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,5120,2048,0.027021333575248718
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,4096,16384,0.03126755687925551
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,6144,128,0.012040889097584618
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,4096,51200,0.08814755413267349
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,4096,12288,0.02576444380813175
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,4096,16384,0.03525866733656989
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,4096,16384,0.06812089019351535
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,4096,65536,0.1978142261505127
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,4096,12288,0.02721333338154687
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,4096,10240,0.022522666388087805
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,4096,51200,0.15994221634334987
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,4096,12288,0.05515199899673462
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,4096,8192,0.01622488929165734
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,4096,7168,0.014463999205165438
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,4096,10240,0.024129778146743774
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,4096,10240,0.0506586664252811
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,4096,6144,0.012729778057999082
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,4096,8192,0.04459111226929558
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,4096,8192,0.022288888692855835
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,4096,5120,0.011352889239788055
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,4096,7168,0.020594666401545208
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,4096,7168,0.04223733478122287
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,4096,4096,0.01036088913679123
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,4096,6144,0.019273777802785236
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,4096,6144,0.039234668016433716
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,4096,3584,0.009117333425415887
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,4096,5120,0.03742311067051358
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,4096,5120,0.01789155602455139
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,4096,4096,0.016526222229003906
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,4096,3072,0.008288000192907121
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,4096,4096,0.03453777896033393
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,5120,2560,0.015504888362354703
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,4096,2560,0.007844444778230455
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,4096,3584,0.016134222348531086
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,4096,2048,0.006897777732875612
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,4096,3072,0.031897776656680636
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,4096,3072,0.014563555518786112
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,4096,1536,0.0052328887912962176
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,4096,2560,0.014206222361988492
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,4096,2048,0.02769688930776384
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,4096,1024,0.004575110971927643
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,4096,1536,0.013016000390052795
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,4096,1536,0.025695110360781353
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,4096,768,0.004193777839342753
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,4096,1024,0.024216888679398432
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,4096,1024,0.012811555630630918
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,4096,512,0.003567111161020067
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,4096,768,0.02366311185889774
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,4096,768,0.012726222475369772
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,4096,256,0.003273777870668305
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,4096,512,0.022679999470710754
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,4096,512,0.01240533341964086
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,4096,128,0.003154666680428717
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,4096,256,0.011750222080283694
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,4096,64,0.0031635556370019913
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,4096,128,0.018232888645595975
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,4096,128,0.011754666765530905
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,4096,32,0.0031386667655573953
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,4096,64,0.011740444435013665
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,4096,32,0.012044444680213928
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,3584,65536,0.10872089200549656
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,4096,3584,0.03286044465170966
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,3584,51200,0.06627733177608915
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,4096,2560,0.02888800038231744
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,4096,2048,0.01348977784315745
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,3584,16384,0.02808177802297804
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,3584,51200,0.08649688959121704
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,3584,65536,0.19741243786282012
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,3584,12288,0.02311644454797109
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,3584,16384,0.03330933385425144
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,3584,16384,0.06730488936106364
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,3584,12288,0.026100445124838088
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,3584,12288,0.05567022164662679
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,3584,51200,0.159588442908393
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,3584,8192,0.018906666172875296
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,3584,10240,0.023580445183648005
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,4096,256,0.021351110604074266
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,3584,10240,0.050604446066750415
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,3584,7168,0.01365066650840971
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,3584,6144,0.012070222033394707
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,3584,8192,0.04442488816049364
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,3584,8192,0.021695110532972548
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,3584,7168,0.020298666424221463
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,3584,5120,0.011008888483047485
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,3584,6144,0.01886666648917728
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,3584,6144,0.03941155473391215
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,3584,4096,0.00998399986161126
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,3584,5120,0.01787911189926995
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,3584,5120,0.037032888995276556
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,3584,3584,0.008650666309727563
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,3584,4096,0.016492444607946608
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,3584,4096,0.03424088822470771
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,3584,3072,0.008100444244013892
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,3584,3584,0.015512888630231222
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,3584,3584,0.03207022282812331
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,3584,2560,0.006950221955776215
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,3584,3072,0.01481066644191742
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,3584,3072,0.029166221618652344
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,3584,2048,0.0059368887709246735
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,3584,2560,0.013800889253616333
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,3584,10240,0.02123466630776723
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,3584,1536,0.004920000003443824
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,3584,2048,0.027061333258946735
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,3584,1536,0.012861332959598966
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,3584,1536,0.025762667258580525
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,3584,1024,0.0041831110914548235
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,3584,7168,0.04253600041071574
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,3584,1024,0.012738666600651212
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,3584,1024,0.0240000006225374
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,3584,768,0.0038533334930737815
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,3584,512,0.0035031110876136353
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,3584,768,0.02366399930583106
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,3584,768,0.012409778104888068
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,3584,256,0.003491555651028951
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,3584,512,0.01239733315176434
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,3584,512,0.02251911163330078
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,3584,128,0.0031511110977994073
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,3584,256,0.022653333014912073
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,3584,128,0.01143200033240848
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,3584,128,0.020241777102152508
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,3584,64,0.0028719999310043124
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,3584,32,0.0031635556370019913
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,3584,2560,0.0284551117155287
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,3584,64,0.012064889073371887
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,3584,32,0.011385777758227454
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,3584,2048,0.013404444687896304
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,3072,65536,0.07168889045715332
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,3072,51200,0.058766219351026744
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,3072,65536,0.10609600279066299
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,3072,16384,0.0225582222143809
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,3072,51200,0.08439111047320896
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,3584,65536,0.08232888910505506
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,3072,12288,0.018744000130229525
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,3072,16384,0.03253777821858724
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,3072,16384,0.06710488928688897
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,3072,10240,0.016522667474216886
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,3072,51200,0.15934577253129747
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,3072,8192,0.014785778191354541
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,3072,12288,0.05455733338991801
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,3072,10240,0.023267555567953322
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,3072,10240,0.050168000989490084
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,3072,7168,0.013619555367363824
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,3584,256,0.011709333293967776
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,3072,8192,0.021032000581423443
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,3072,8192,0.04418399930000305
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,3072,6144,0.01202933324707879
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,3072,5120,0.011009777585665384
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,3072,7168,0.04155911008516947
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,3072,6144,0.038704001241260104
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,3072,6144,0.018600889378123812
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,3072,4096,0.009974222216341231
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,3072,5120,0.017217778497272067
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,3072,3584,0.008772444393899705
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,3072,4096,0.03404266635576884
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,3072,4096,0.015136000182893542
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,3072,3072,0.007913777397738563
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,3072,3584,0.014793778459231058
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,3072,3584,0.031389332479900785
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,3072,2560,0.007248889240953658
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,3072,3072,0.014134221606784396
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,3072,3072,0.028817776176664565
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,3072,2048,0.00656444455186526
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,3072,2560,0.013752000199423896
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,3072,2048,0.013360888593726687
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,3072,2048,0.02622755534119076
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,3072,1536,0.0052684446175893145
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,3072,65536,0.19713777965969512
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,3072,1024,0.004237333519591225
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,3072,12288,0.02572711143228743
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,3072,1536,0.025711999999152288
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,3072,1536,0.012784000072214337
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,3072,768,0.0038497779104444715
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,3072,1024,0.0123857781291008
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,3072,1024,0.025199999411900837
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,3072,512,0.0035182221068276297
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,3072,768,0.012096000214417776
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,3072,768,0.023689778314696416
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,3072,7168,0.020006222857369315
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,3072,256,0.0035182221068276297
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,3072,512,0.0226248883538776
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,3072,512,0.012266666524940066
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,3072,256,0.02232622272438473
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,3072,256,0.011720000041855706
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,3072,64,0.0028862222615215513
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,3072,128,0.011400000088744693
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,3072,128,0.01947022146648831
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,3072,32,0.0029893333299292457
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,3072,64,0.011529777612951068
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,2560,65536,0.06293066342671712
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,3072,32,0.011374221907721626
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,2560,51200,0.04934844374656677
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,2560,65536,0.10400799910227458
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,3072,2560,0.02754577828778161
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,2560,16384,0.02232088810867733
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,2560,51200,0.07968799935446845
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,2560,65536,0.19666666454739043
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,2560,16384,0.031121777163611516
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,2560,16384,0.06663378079732259
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,2560,51200,0.1598337756262885
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,2560,10240,0.016137777103318107
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,2560,12288,0.025311999850802954
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,2560,12288,0.05460888809627957
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,2560,8192,0.014460444450378418
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,3072,128,0.0028844444702068963
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,2560,10240,0.022857778602176245
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,2560,10240,0.050007111496395536
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,2560,7168,0.012541333006487953
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,3072,5120,0.03644711110326979
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,2560,8192,0.021332444416152105
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,2560,8192,0.04383200075891283
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,2560,6144,0.011405333048767514
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,2560,7168,0.019613333874278598
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,2560,7168,0.04157511062092251
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,2560,6144,0.038691557115978666
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,2560,6144,0.01832799944612715
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,2560,4096,0.008959111240175035
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,2560,5120,0.036736889017952815
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,2560,5120,0.01648266613483429
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,2560,3584,0.00829777783817715
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,2560,4096,0.015138667490747241
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,2560,4096,0.03255733185344272
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,2560,3072,0.007772444850868649
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,2560,3584,0.014522666732470194
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,2560,3584,0.031113776895735
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,2560,2560,0.006963555183675554
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,2560,3072,0.014137778017255994
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,2560,3072,0.02984444300333659
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,2560,2048,0.006056889063782162
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,2560,2560,0.013776000175211163
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,2560,2560,0.02776799930466546
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,2560,1536,0.005024000174469418
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,2560,2048,0.0262071109480328
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,2560,2048,0.013447110851605734
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,2560,12288,0.018515555395020377
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,2560,1024,0.004231111043029361
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,2560,1536,0.012778666284349231
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,2560,1536,0.025401777691311304
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,2560,1024,0.02437777817249298
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,2560,1024,0.012521777715947894
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,2560,512,0.0035128887328836652
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,2560,768,0.02365866634580824
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,2560,768,0.012105777859687805
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,2560,256,0.003169777699642711
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,2560,512,0.022330666581789654
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,2560,512,0.01221422188811832
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,2560,128,0.003160888950030009
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,2560,256,0.02125066684352027
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,2560,256,0.011712888876597086
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,2560,64,0.0028648889727062653
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,2560,32,0.002971555623743269
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,2560,5120,0.010332444475756751
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,2560,128,0.011732444167137146
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,2048,65536,0.052348444859186806
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,2560,64,0.011418666276666852
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,2560,32,0.0110871113008923
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,2048,51200,0.042740444342295326
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,2048,16384,0.018633777896563213
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,2048,65536,0.100545777214898
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,2048,51200,0.07789866791831122
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,2048,16384,0.030525333351559106
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,2048,12288,0.015295111470752291
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,2048,51200,0.15903822580973306
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,2048,65536,0.19700000021192762
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,2048,10240,0.015443555182880826
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,2048,12288,0.05460000038146973
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,2048,12288,0.02478844424088796
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,2048,8192,0.013404444687896304
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,2048,10240,0.02269422180122799
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,2048,10240,0.04960799879497952
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,2048,8192,0.0199955552816391
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,2560,768,0.0038808890514903595
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,2048,6144,0.011153777440388998
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,2048,7168,0.01864266726705763
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,2048,7168,0.041464000940322876
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,2048,5120,0.0124177775449223
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,2048,6144,0.017551110850440133
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,2048,6144,0.038247111770841814
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,2048,4096,0.010999110837777456
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,2048,5120,0.01647911138004727
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,2048,5120,0.035509334670172796
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,2560,128,0.019306666321224637
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,2048,4096,0.014937778313954672
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,2048,4096,0.03166933192147149
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,2048,3072,0.008323555191357931
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,2048,3584,0.014767999450365702
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,2048,3584,0.03087288803524441
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,2048,3072,0.029164443413416546
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,2048,2560,0.007613333563009898
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,2048,16384,0.0661768913269043
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,2048,2560,0.013595555391576556
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,2048,2560,0.02740266587999132
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,2048,2048,0.006575111299753189
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,2048,7168,0.01202488856183158
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,2048,8192,0.04382933179537455
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,2048,1536,0.004612444589535396
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,2048,2048,0.026330666409598455
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,2048,2048,0.013139555851618448
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,2048,1024,0.004230222354332606
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,2048,1536,0.012747555143303342
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,2048,1536,0.025758221745491028
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,2048,768,0.0038977778620190094
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,2048,1024,0.012320888539155325
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,2048,512,0.0035182221068276297
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,2048,768,0.02370311154259576
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,2048,512,0.011752000285519494
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,2048,256,0.003157333367400699
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,2048,512,0.022288888692855835
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,2048,256,0.021301334102948506
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,2048,256,0.011695110963450538
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,2048,128,0.00300177786913183
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,2048,3072,0.014104000396198697
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,2048,128,0.018888889087571036
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,2048,64,0.011376000112957425
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,2048,32,0.0028808888875775864
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,2048,32,0.011017777853541903
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,1536,65536,0.03830133212937249
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,2048,1024,0.02404533326625824
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,2048,768,0.01240711079703437
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,1536,65536,0.09458221991856892
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,2048,3584,0.009672000176376766
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,1536,51200,0.03119644522666931
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,1536,16384,0.01792622274822659
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,1536,51200,0.07573422458436754
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,1536,65536,0.19651110967000326
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,1536,12288,0.015093333191341825
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,1536,16384,0.03010666701528761
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,1536,51200,0.1589733362197876
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,1536,16384,0.06635555293824938
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,1536,10240,0.013832000394662222
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,1536,12288,0.024353777368863423
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,2048,128,0.011383111278216044
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,1536,12288,0.05437689026196798
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,1536,8192,0.012654222548007965
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,1536,7168,0.011699555648697747
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,1536,10240,0.04911999901135763
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,1536,8192,0.043939554029040866
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,1536,8192,0.01984177695380317
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,1536,6144,0.010727110836240979
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,1536,7168,0.017869333426157635
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,1536,7168,0.040568000740475126
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,1536,5120,0.009979555176364051
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,1536,6144,0.01684266659948561
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,1536,6144,0.03750666644838121
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,1536,4096,0.00943022221326828
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,1536,5120,0.015795555379655626
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,1536,5120,0.034625778595606484
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,1536,3584,0.007632888853549957
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,1536,4096,0.014993778533405729
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,1536,4096,0.031848000155554876
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,1536,3072,0.006779555645253923
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,1536,3584,0.03056710958480835
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,1536,2560,0.005938666562239329
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,1536,3072,0.013859555953078799
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,1536,3072,0.029726223813162908
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,1536,2048,0.0052533331844541765
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,1536,2560,0.013726222018400827
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,1536,2560,0.027079999446868896
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,1536,1536,0.0047048889100551605
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,1536,2048,0.013419555293189155
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,1536,2048,0.02606133288807339
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,1536,1024,0.003899555653333664
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,1536,1536,0.012730666332774691
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,1536,1536,0.025702221526039973
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,2048,64,0.0028159999185138275
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,1536,768,0.003576888806290097
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,1536,1024,0.012416000167528788
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,1536,10240,0.022336888644430373
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,1536,512,0.0032106666929192017
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,1536,256,0.0031635556370019913
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,1536,768,0.02461244497034285
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,1536,768,0.012336889074908363
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,1536,128,0.002855111120475663
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,1536,512,0.011753777662913004
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,1536,512,0.023260444402694702
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,1536,64,0.0028026666906144884
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,1536,256,0.022290666898091633
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,1536,256,0.011443555355072021
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,1536,32,0.002797333316670524
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,1536,128,0.0185217774576611
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,1024,65536,0.02784088916248745
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,1536,64,0.011704000333944956
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,1536,32,0.0107351111041175
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,1024,51200,0.023640000157886084
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,1024,65536,0.09086489015155369
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,1536,3584,0.014454222387737699
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,1024,16384,0.01443377799457974
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,1024,51200,0.07441155778037177
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,1024,65536,0.19632532861497667
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,1024,51200,0.15979466173383924
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,1024,12288,0.012701333396964602
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,1024,16384,0.02979288829697503
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,1024,10240,0.011598221957683563
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,1024,12288,0.053900443845325045
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,1024,12288,0.02365866634580824
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,1024,8192,0.012601777911186218
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,1024,10240,0.0209840006298489
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,1024,10240,0.04821955495410495
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,1024,7168,0.011800000237094032
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,1024,8192,0.01889866590499878
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,1536,1024,0.023715555667877197
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,1024,6144,0.011358222199810876
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,1024,7168,0.039429333474900984
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,1024,6144,0.016732444365819294
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,1024,5120,0.010296888649463654
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,1024,6144,0.03683200147416856
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,1024,5120,0.034585777256223894
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,1024,4096,0.00869599978129069
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,1024,4096,0.014846222268210517
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,1024,16384,0.0664773318502638
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,1024,4096,0.03223377797338698
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,1024,3584,0.007250666618347168
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,1024,3584,0.03054311209254795
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,1024,3584,0.014499555031458536
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,1024,3072,0.00675644435816341
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,1024,8192,0.042083554797702365
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,1024,3072,0.028148445818159316
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,1024,2560,0.005951111101441913
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,1024,7168,0.017892445127169292
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,1024,2048,0.006268444574541516
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,1024,2560,0.0281057788266076
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,1024,1536,0.005560889012283749
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,1536,128,0.011728000309732227
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,1024,2048,0.027110222313139174
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,1024,2048,0.013072888884279462
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,1024,1024,0.004222222086456087
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,1024,1536,0.012776888906955719
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,1024,1536,0.025776000486479864
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,1024,5120,0.015570667054918079
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,1024,768,0.003952888978852166
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,1024,1024,0.024657777614063684
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,1024,512,0.003621333175235324
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,1024,1024,0.012096000214417776
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,1024,256,0.0031537777847713898
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,1024,768,0.023334221707450017
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,1024,768,0.012208888928095499
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,1024,512,0.022407111194398668
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,1024,512,0.011754666765530905
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,1024,256,0.011704000333944956
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,1024,256,0.02095111045572493
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,1024,64,0.0028897778441508612
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,1024,32,0.00282222218811512
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,1024,128,0.0192577772670322
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,1024,128,0.011353777514563667
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,768,65536,0.031439112292395696
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,1024,64,0.011385777758227454
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,768,51200,0.024897777371936377
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,1024,32,0.010695111420419482
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,768,65536,0.0920320020781623
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,768,16384,0.012149333126015134
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,1024,3072,0.014148443937301636
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,768,51200,0.07214044200049506
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,768,65536,0.196615113152398
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,768,51200,0.15858756171332464
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,768,16384,0.02901511059867011
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,1024,2560,0.013403555585278405
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,768,10240,0.009891555541091496
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,768,12288,0.023033777872721355
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,768,12288,0.0529457794295417
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,768,8192,0.009355555805895064
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,768,10240,0.04727288749482897
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,768,10240,0.02121688922246297
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,768,7168,0.008965333302815756
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,768,8192,0.0188737776544359
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,768,8192,0.04109777675734626
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,768,6144,0.009485333330101436
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,768,7168,0.017684444785118103
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,768,7168,0.03906844390763177
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,768,5120,0.008127999802430471
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,768,6144,0.01664266652531094
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,768,6144,0.03628888726234436
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,1024,128,0.002846222163902389
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,768,4096,0.007589333587222629
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,768,3584,0.007635555333561367
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,768,5120,0.03430577781465318
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,768,5120,0.015480000111791821
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,768,3072,0.006568000134494569
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,768,4096,0.0148026661740409
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,768,4096,0.032257778777016535
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,768,2560,0.005940444353553984
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,768,3584,0.014478221535682678
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,768,3072,0.013758222262064615
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,768,2048,0.005244444641802046
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,768,2560,0.013772444592581855
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,768,2560,0.027423111928833857
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,768,1536,0.004828444371620814
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,768,2048,0.02706844442420536
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,768,2048,0.013057777451144325
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,768,1024,0.0039022221333450745
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,768,1536,0.012838222086429596
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,768,1536,0.0262080000506507
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,768,12288,0.010973333484596677
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,768,768,0.0034933334423436057
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,768,1024,0.012123555772834353
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,768,16384,0.06622311141755846
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,768,512,0.0031991110493739447
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,768,1024,0.025379555092917547
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,768,768,0.02471911079353756
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,768,768,0.012039110892348819
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,768,256,0.0028479999552170434
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,768,128,0.0028444443725877335
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,768,512,0.022426666484938726
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,768,256,0.02111111084620158
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,768,256,0.011702222128709158
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,768,64,0.002485333424475458
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,768,128,0.011728000309732227
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,768,128,0.018187556001875136
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,512,65536,0.02328266700108846
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,768,64,0.011694221860832639
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,768,32,0.011123555401961008
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,512,51200,0.01871200071440803
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,512,65536,0.08892089128494263
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,512,65536,0.19663555092281768
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,768,3584,0.03052355514632331
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,512,51200,0.06951822174919976
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,512,16384,0.012602667013804117
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,768,3072,0.02881422307756212
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,512,12288,0.010320888625250923
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,512,51200,0.15806489520602757
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,512,10240,0.010001777774757808
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,512,16384,0.027808000644048054
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,512,16384,0.06541155444251166
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,512,12288,0.02259822189807892
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,512,12288,0.051967998345692955
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,512,8192,0.009345778160625035
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,512,7168,0.009000000026490953
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,512,10240,0.04738755689726936
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,512,8192,0.04138488901986016
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,512,8192,0.018366222580273945
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,512,6144,0.0075777777367168
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,512,7168,0.017872000734011333
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,512,7168,0.0388062232070499
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,512,5120,0.008329778081840938
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,512,6144,0.016255110502243042
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,512,6144,0.03649955656793382
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,768,512,0.012056888805495368
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,512,4096,0.007520889242490132
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,512,3584,0.006963555183675554
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,512,5120,0.03458844290839301
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,512,5120,0.015507555670208402
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,512,3072,0.006287999865081575
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,768,32,0.0028213332924577924
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,512,4096,0.014817777607176038
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,512,4096,0.032207111517588295
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,512,2560,0.0059057776298787855
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,512,3584,0.031119111511442397
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,512,3584,0.014152889450391134
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,512,2048,0.0052915554907586836
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,512,3072,0.013805333111021252
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,512,2560,0.013752889302041797
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,512,2048,0.012904889053768583
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,512,2048,0.026736888620588515
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,512,1024,0.003882666842805015
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,512,1536,0.012746666868527731
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,512,1536,0.02442311081621382
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,512,768,0.0038559999730851916
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,512,1024,0.012426666915416718
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,512,1024,0.024283554818895128
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,512,512,0.0034977777136696708
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,512,768,0.011744000017642975
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,512,768,0.0240320000383589
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,512,256,0.002846222163902389
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,512,512,0.011753777662913004
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,512,10240,0.020246222615242004
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,512,512,0.02233155568440755
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,512,128,0.0028737777223189673
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,512,256,0.02201866606871287
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,512,128,0.018183999591403537
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,512,64,0.0025439999169773525
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,512,128,0.011346666349305047
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,512,32,0.0028284444577164124
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,256,65536,0.0166320006052653
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,512,64,0.011136888629860349
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,512,32,0.010712888505723743
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,256,51200,0.014271999398867289
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,256,65536,0.08496799733903672
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,512,3072,0.02791644467247857
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,512,1536,0.004576888763242298
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,256,65536,0.19592800405290392
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,256,16384,0.009703111317422655
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,256,51200,0.06729866398705377
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,256,12288,0.008381333616044786
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,256,51200,0.1583555539449056
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,256,16384,0.06338755289713542
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,256,10240,0.009339555270142024
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,256,12288,0.022322666313913133
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,256,12288,0.051648888323042125
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,256,8192,0.008292444050312042
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,256,10240,0.020302222834693063
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,256,10240,0.046572443511750966
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,256,7168,0.008164444731341468
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,256,8192,0.01830577850341797
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,256,8192,0.0414044459660848
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,256,6144,0.007606222397751278
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,256,7168,0.017346666918860543
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,256,7168,0.038719111018710665
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,256,5120,0.007981333467695449
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,512,256,0.011732444167137146
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,256,6144,0.035953776703940496
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,256,4096,0.007351111206743453
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,256,6144,0.016177778442700703
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,256,5120,0.03392533461252848
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,256,5120,0.01535999940501319
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,256,3584,0.006976000136799282
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,256,3072,0.006970666348934174
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,256,4096,0.032223112053341336
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,256,3584,0.030511998467975195
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,256,3584,0.014084445105658637
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,256,2560,0.006628444625271692
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,256,3072,0.013750221994188098
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,256,3072,0.029490666257010564
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,256,2048,0.006248888870080312
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,512,2560,0.028113779094484117
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,256,2560,0.02725244396262699
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,256,1536,0.004238222208287981
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,256,2048,0.026512889398468867
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,256,2048,0.013152889079517789
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,256,1024,0.003850666599141227
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,256,1536,0.012383999923865
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,256,1536,0.02608355548646715
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,256,768,0.003491555651028951
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,256,1024,0.0236488895283805
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,256,1024,0.012409778104888068
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,256,512,0.003208000005947219
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,256,768,0.012106666962305704
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,256,256,0.0028773333049482773
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,256,512,0.012062222593360476
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,256,512,0.021613332960340712
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,256,128,0.002834666727317704
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,256,256,0.021624000536070928
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,256,256,0.011683555940786997
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,256,64,0.0024871110088295406
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,256,128,0.011035555766688453
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,256,32,0.0025271111064487034
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,256,128,0.01924622224436866
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,128,65536,0.015470221638679504
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,256,64,0.011543999943468304
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,256,32,0.01073333372672399
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,256,4096,0.014143110977278816
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,128,51200,0.012734221915404001
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,128,65536,0.08437244759665595
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,128,16384,0.009866666462686326
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,128,51200,0.06651910808351305
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,128,51200,0.15784266259935167
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,256,2560,0.013421333498424955
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,128,12288,0.008302222523424361
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,128,16384,0.02749866743882497
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,128,16384,0.06300710969501071
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,128,10240,0.007651555869314406
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,128,12288,0.022209778428077698
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,128,12288,0.05138311121198866
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,128,8192,0.007288888924651676
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,128,10240,0.0472302238146464
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,128,10240,0.02023555503951179
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,128,7168,0.0069715554515520734
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,256,768,0.023373333944214716
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,128,8192,0.01847822301917606
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,128,8192,0.04076177875200907
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,128,6144,0.006581333362393909
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,128,5120,0.006241777704821692
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,128,7168,0.03930577635765076
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,128,7168,0.01718311177359687
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,128,4096,0.006583111153708563
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,128,6144,0.016269332832760282
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,128,5120,0.0151582227812873
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,128,5120,0.03449599941571554
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,128,3584,0.006263999889294307
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,128,4096,0.014416888356208801
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,128,4096,0.03127466638882955
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,128,3072,0.005949333310127258
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,128,3584,0.014450665977266101
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,128,3584,0.030200888713200886
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,128,2560,0.006313777632183499
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,128,3072,0.013541333377361298
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,128,3072,0.028781334559122723
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,128,2048,0.006256888724035687
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,128,2560,0.02881866693496704
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,128,2560,0.01312800000111262
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,128,65536,0.19591732819875082
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,128,1536,0.004572444491916233
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,128,2048,0.012753778033786349
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,128,1024,0.0038648889296584656
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,128,1536,0.012375999655988483
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,128,768,0.003506666670242945
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,128,1024,0.025412445267041523
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,128,1024,0.012042666474978128
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,256,16384,0.02713866697417365
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,128,512,0.0032097777972618737
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,128,768,0.02330222229162852
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,128,768,0.011735111474990845
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,128,256,0.0029893333299292457
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,128,512,0.011716444459226398
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,128,512,0.022299556268586054
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,128,128,0.0028071111689011254
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,128,256,0.011191999746693505
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,128,256,0.020922667450375024
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,128,6144,0.035875555541780256
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,128,128,0.011063999599880643
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,128,32,0.0026462222966882917
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,128,64,0.0107351111041175
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,64,65536,0.013857777747843
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,128,32,0.010383110907342698
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,64,51200,0.012157333393891653
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,64,65536,0.08268711302015516
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,64,16384,0.007981333467695449
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,64,51200,0.06612444586224027
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,128,2048,0.026386666629049513
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,64,12288,0.007324444750944774
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,64,10240,0.007272889216740926
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,128,1536,0.025765332910749648
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,64,16384,0.02699911097685496
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,64,8192,0.006917333437336816
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,64,12288,0.022295110755496558
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,64,7168,0.006575111299753189
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,64,10240,0.020020445187886555
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,64,8192,0.01795644395881229
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,64,5120,0.006272000157170826
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,64,7168,0.01722666621208191
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,64,4096,0.005667555663320754
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,64,6144,0.015799999237060547
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,64,3584,0.006278222219811545
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,64,5120,0.01514311134815216
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,64,3072,0.0058986664646201665
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,64,4096,0.014150222142537435
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,64,2560,0.006239111224810283
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,64,3584,0.013818666338920593
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,64,2048,0.0058906666106647914
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,64,3072,0.013473778135246701
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,64,1536,0.004217777815130022
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,64,2560,0.013131555583741931
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,64,1024,0.003855111284388436
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,64,2048,0.012730666332774691
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,64,768,0.003216000066863166
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,64,1536,0.012444444828563266
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,64,512,0.0031395554542541504
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,64,1024,0.011762667033407422
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,64,256,0.00281866660548581
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,64,768,0.011752888560295105
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,64,128,0.002528000002106031
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,64,512,0.011705777711338468
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,64,64,0.002522666628162066
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,64,256,0.011024889018800525
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,64,32,0.002493333278430833
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,64,128,0.010767111347781287
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,32,65536,0.012096888489193387
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,64,6144,0.006280000011126201
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,64,32,0.010406222608354356
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,32,51200,0.010679999987284342
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,32,16384,0.007252444823582967
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,32,65536,0.08202133576075236
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,32,12288,0.007272000114123027
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,32,51200,0.06367822488149007
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,32,16384,0.027003554834259882
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,32,10240,0.007297777467303806
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,128,64,0.002817777709828483
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,32,8192,0.007158222297827403
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,32,7168,0.0069395556218094295
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,32,10240,0.02022133270899455
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,32,8192,0.018254222141371835
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,32,7168,0.01756266587310367
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,32,5120,0.00627377794848548
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,32,6144,0.016176000237464905
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,32,4096,0.005892444401979446
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,32,5120,0.015459555718633862
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,32,3584,0.0062977779242727495
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,32,3072,0.006260444306664997
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,32,4096,0.014153778553009033
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,32,2560,0.006005333529578314
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,32,3584,0.014208000567224292
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,32,2048,0.006245333287451003
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,32,3072,0.013765333427323235
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,32,1536,0.00453333349691497
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,64,64,0.010666666759385003
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,32,2560,0.013075555364290873
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,32,1024,0.003826666623353958
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,32,2048,0.013075555364290873
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,32,1536,0.012730666332774691
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,32,512,0.003176888864901331
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,32,1024,0.012039999994966718
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,32,256,0.0028239999794297745
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,32,768,0.012072888513406118
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,32,128,0.00286311118139161
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,32,512,0.011769777370823754
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,32,64,0.00254488881263468
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,32,256,0.011182222101423474
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,32,12288,0.022314666046036616
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,32,128,0.011401777466138205
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,32,32,0.002483555633160803
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,32,6144,0.006232888748248418
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,32,64,0.011376000112957425
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,96,32,32,0.011364444262451597
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,65536,16384,0.21467199590471056
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,96,32,768,0.0035439998739295532
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,65536,51200,0.63481691148546
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,65536,12288,0.2784213225046794
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,65536,12288,0.16008622116512722
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,65536,10240,0.2081244389216105
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,65536,51200,1.1441279517279732
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,65536,10240,0.13617066542307535
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,65536,8192,0.17154755857255724
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,65536,7168,0.15055378278096518
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,65536,8192,0.11629154947068955
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,65536,7168,0.09944533639483982
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,65536,6144,0.128767106268141
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,65536,5120,0.1095928880903456
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,65536,4096,0.08983822001351251
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,65536,16384,0.37257689899868435
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,65536,4096,0.06286666790644328
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,65536,6144,0.08753333489100139
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,65536,3072,0.06960178083843656
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,65536,3584,0.05758044454786512
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,65536,3584,0.07935733265346952
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,65536,2560,0.05788977940877279
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,65536,2048,0.04698488778538174
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,65536,3072,0.05110311177041796
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,65536,1536,0.03731377919514974
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,65536,2560,0.04569244384765625
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,65536,1024,0.028813332319259644
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,65536,2048,0.040159109565946795
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,65536,1536,0.04855733447604709
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,65536,768,0.021399110555648804
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,65536,1024,0.038089778688218855
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,65536,512,0.014693333042992486
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,65536,256,0.009296000003814697
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,65536,128,0.008009778128729926
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,65536,512,0.024496888120969135
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,65536,256,0.019089778264363606
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,65536,64,0.006005333529578314
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,65536,32,0.006048000107208888
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,65536,768,0.03020355436537001
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,65536,128,0.017847110827763874
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,65536,64,0.017518222332000732
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,65536,32,0.019786667492654588
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,65536,5120,0.07470577955245972
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,51200,16384,0.27678577105204266
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,51200,51200,0.5040426784091526
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,51200,16384,0.1739048825369941
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,51200,12288,0.20951555834876168
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,51200,65536,0.6633102099100748
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,51200,51200,0.8583351241217719
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,51200,10240,0.17682222525278726
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,51200,12288,0.12889777289496526
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,51200,65536,1.0915697945488823
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,51200,10240,0.11062400208579169
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,51200,8192,0.1441671053568522
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,51200,7168,0.1271173291736179
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,51200,5120,0.09230755435095893
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,51200,6144,0.1088542209731208
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,51200,6144,0.07194311088985868
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,51200,4096,0.07547377877765231
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,51200,3584,0.06683466831843059
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,51200,8192,0.09481066465377808
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,51200,7168,0.0815360016292996
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,51200,5120,0.061958220269944936
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,51200,3072,0.05863110886679756
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,51200,2560,0.04962311188379923
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,51200,2048,0.04048711061477661
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,51200,3072,0.0435733331574334
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,51200,3584,0.04830933279461331
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,51200,1536,0.032391111056009926
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,51200,2560,0.03913244605064392
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,51200,2048,0.03497688968976339
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,51200,1024,0.024332443873087566
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,51200,4096,0.05266044537226359
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,51200,768,0.017812444104088675
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,51200,512,0.012855110896958245
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,51200,256,0.00889244427283605
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,51200,1536,0.041466666592492
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,51200,128,0.005953777581453323
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,51200,64,0.005241777747869492
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,51200,512,0.02124622298611535
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,51200,256,0.017525333497259352
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,51200,1024,0.0324524442354838
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,51200,32,0.00554577757914861
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,51200,128,0.016524444023768108
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,51200,64,0.01720622181892395
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,51200,32,0.01865955524974399
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,16384,16384,0.086444444126553
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,16384,51200,0.2620311048295763
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,16384,65536,0.3364497820536296
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,16384,65536,0.2623537646399604
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,16384,12288,0.06747466988033719
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,16384,51200,0.20261243979136148
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,16384,10240,0.05574488639831543
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,16384,16384,0.07512444257736206
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,16384,8192,0.04756266540951199
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,16384,12288,0.05635199944178263
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,16384,7168,0.04069066709942288
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,16384,8192,0.04344800114631653
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,16384,10240,0.0495760010348426
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,16384,6144,0.035475555393430926
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,16384,5120,0.03050044510099623
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,16384,7168,0.03838222225507101
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,16384,4096,0.025220443805058796
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,16384,3584,0.022618666291236877
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,16384,5120,0.030887110365761652
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,16384,6144,0.034918222162458636
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,16384,4096,0.02717599935001797
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,16384,3072,0.020000888241661918
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,16384,2560,0.01685422162214915
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,16384,3584,0.02515911062558492
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,16384,2048,0.014011555247836642
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,16384,1536,0.011352000137170156
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,16384,3072,0.02272266646226247
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,16384,1024,0.009294222626421187
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,16384,2560,0.02144533395767212
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,16384,768,0.0075342224703894714
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,16384,512,0.005929777605666055
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,16384,2048,0.019911110401153564
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,16384,1536,0.02144177754720052
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,16384,256,0.004221333397759331
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,16384,1024,0.018186666899257235
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,16384,128,0.003858666867017746
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,16384,768,0.017143110434214275
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,16384,64,0.003522666792074839
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,16384,512,0.015156444576051501
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,16384,256,0.013077333569526672
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,16384,128,0.012618666721714867
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,16384,32,0.013394667042626275
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,16384,64,0.013420444395807056
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,12288,65536,0.27327556080288357
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,12288,51200,0.21174577871958414
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,12288,65536,0.20978489187028673
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,12288,16384,0.07163733243942261
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,12288,51200,0.1630515522427029
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,12288,12288,0.05613155497445
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,12288,10240,0.04604977700445387
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,12288,16384,0.061906668874952525
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,12288,12288,0.047107554144329496
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,12288,8192,0.038797332180870905
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,12288,10240,0.04152533411979675
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,12288,7168,0.03380622135268317
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,12288,6144,0.029673778348498877
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,51200,768,0.025470222036043804
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,12288,8192,0.036644445525275335
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,12288,5120,0.025797333982255723
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,12288,4096,0.022311111291249592
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,12288,7168,0.03282399972279867
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,12288,6144,0.02999911043379042
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,12288,3584,0.019018666611777413
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,12288,3072,0.016982222596804302
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,12288,5120,0.026491555902693007
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,12288,2560,0.014473777678277759
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,12288,4096,0.022847111026446026
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,12288,2048,0.01274400038851632
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,12288,3584,0.022108443909221228
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,12288,3072,0.020558221472634208
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,16384,32,0.0035137778355015647
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,12288,1024,0.008612444831265343
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,12288,2560,0.019482667247454327
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,12288,2048,0.018073777357737224
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,12288,768,0.007317333585686154
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,12288,512,0.005700444595681296
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,12288,256,0.0041866666740841335
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,12288,1024,0.01684888866212633
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,12288,128,0.0035822221802340615
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,12288,512,0.014157333307796054
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,12288,64,0.0034924443397257063
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,12288,256,0.012723555167516073
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,12288,32,0.003506666670242945
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,12288,128,0.0127688886390792
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,12288,64,0.01203733351495531
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,12288,32,0.012444444828563266
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,10240,65536,0.24890311559041342
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,10240,65536,0.2018115520477295
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,10240,51200,0.16448177231682673
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,10240,16384,0.05595111184649997
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,10240,12288,0.044181333647833936
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,10240,51200,0.15705155001746282
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,10240,16384,0.06025866667429606
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,10240,10240,0.039832890033721924
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,12288,1536,0.010319111247857412
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,10240,8192,0.032187554571363665
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,10240,12288,0.045202665858798556
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,10240,7168,0.029129776689741347
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,10240,10240,0.04032889008522034
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,10240,6144,0.024694222542974684
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,12288,1536,0.01994755533006456
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,10240,8192,0.03587199913130866
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,10240,4096,0.01775644388463762
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,10240,7168,0.031641778018739485
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,10240,6144,0.028487109475665625
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,10240,3584,0.016343999240133498
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,10240,5120,0.02512888941499922
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,10240,3072,0.014404444230927361
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,10240,4096,0.022467555271254644
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,10240,2560,0.012719111310111152
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,10240,3584,0.021426666114065383
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,10240,3072,0.020242666204770405
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,10240,2048,0.011045333411958484
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,10240,1536,0.009372444616423713
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,10240,2560,0.01921244462331136
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,10240,1024,0.007650666766696506
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,10240,2048,0.01779911087618934
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,10240,768,0.006118222243256039
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,10240,1024,0.01573511130279965
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,10240,512,0.0052044445441828836
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,10240,768,0.01534755527973175
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,10240,256,0.0041928887367248535
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,10240,512,0.013637333280510373
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,10240,128,0.0038444445365005066
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,10240,256,0.0127368892232577
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,10240,64,0.0032106666929192017
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,10240,128,0.012053333222866058
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,10240,5120,0.02167111138502757
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,10240,32,0.003499555504984326
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,10240,64,0.012802666260136498
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,12288,768,0.01520088811715444
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,10240,32,0.013154666456911298
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,8192,65536,0.17547821998596191
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,8192,51200,0.13451643784840903
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,8192,16384,0.048319111267725624
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,8192,65536,0.15893599722120497
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,8192,12288,0.03789955708715651
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,8192,51200,0.12307377656300862
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,8192,10240,0.031050665511025324
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,8192,16384,0.04857244425349765
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,8192,8192,0.0273297776778539
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,8192,12288,0.03765599926312765
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,8192,7168,0.02328266700108846
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,10240,1536,0.018174222773975797
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,8192,10240,0.0335804455810123
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,8192,6144,0.02053777707947625
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,8192,8192,0.029791110091739233
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,8192,5120,0.017510222064124215
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,8192,4096,0.01568888955646091
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,8192,3584,0.013405332962671915
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,8192,5120,0.021588444709777832
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,8192,4096,0.020139555136362713
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,8192,3072,0.01201777739657296
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,8192,2560,0.010428444378905825
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,8192,3584,0.019075555933846366
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,8192,2048,0.009276444713274637
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,8192,3072,0.018223999275101554
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,8192,2560,0.017504000001483493
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,8192,2048,0.01642933322323693
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,8192,1024,0.005896889087226655
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,8192,1536,0.01683555543422699
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,8192,768,0.004584889031118817
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,8192,1024,0.014427555931939019
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,8192,768,0.014135999812020196
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,8192,512,0.0041742221348815495
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,8192,256,0.003559111307064692
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,8192,512,0.013421333498424955
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,8192,256,0.0120666664507654
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,8192,128,0.0035031110876136353
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,8192,64,0.003228444399105178
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,8192,32,0.0031617778456873367
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,8192,7168,0.026111111044883728
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,8192,128,0.011756444142924415
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,8192,64,0.01238044434123569
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,8192,6144,0.02365066607793172
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,8192,32,0.012159999873903064
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,7168,16384,0.04335911075274149
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,7168,65536,0.15426666206783718
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,7168,51200,0.12167733245425755
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,7168,12288,0.03478755553563436
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,7168,51200,0.12161866823832194
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,7168,10240,0.028685334655973647
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,8192,1536,0.00795911086930169
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,7168,16384,0.04820088876618279
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,7168,12288,0.03646666804949442
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,7168,7168,0.021577777134047613
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,7168,10240,0.032531556155946516
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,7168,6144,0.018971555762820773
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,7168,8192,0.02868177824550205
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,7168,5120,0.016527111331621807
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,7168,4096,0.014073777529928418
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,7168,7168,0.025204444924990337
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,7168,3584,0.012423999607563019
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,7168,6144,0.023540443844265405
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,7168,5120,0.021386666430367365
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,7168,3072,0.011304000185595619
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,7168,4096,0.01981244484583537
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,7168,2560,0.009680888719028896
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,7168,2048,0.008720888859695857
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,7168,3072,0.018168000711335074
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,7168,1536,0.007393777370452881
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,7168,2560,0.01739377776781718
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,7168,1024,0.005949333310127258
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,7168,2048,0.01569955547650655
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,7168,768,0.004888888862397936
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,7168,1536,0.01685066686736213
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,7168,512,0.004197333421972063
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,7168,1024,0.014458666245142618
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,7168,768,0.014098667436175875
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,7168,256,0.0035235554807715942
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,7168,512,0.013464888764752282
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,7168,128,0.0035182221068276297
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,7168,65536,0.15437422858344182
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,7168,256,0.012098666694429187
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,7168,64,0.0032151111712058387
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,7168,32,0.0032177778581778207
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,7168,128,0.012092444631788464
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,7168,64,0.011785777906576792
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,7168,8192,0.024874667326609295
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,7168,32,0.012069332930776807
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,6144,65536,0.14172532823350695
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,6144,51200,0.11305422253078884
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,6144,65536,0.14932000637054443
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,6144,51200,0.1167680025100708
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,7168,3584,0.019289778338538278
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,6144,12288,0.03302222159173753
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,6144,16384,0.04622133241759407
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,6144,10240,0.029305779271655615
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,6144,8192,0.023119111855824787
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,6144,12288,0.03576888971858554
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,6144,7168,0.019626667102177937
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,6144,10240,0.0316826668050554
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,6144,6144,0.0173662222094006
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,6144,5120,0.014415999253590902
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,6144,7168,0.024559110403060913
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,6144,6144,0.023080888721677992
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,6144,4096,0.013185777597957186
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,6144,3584,0.011755555868148804
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,6144,5120,0.020968000094095867
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,6144,3072,0.01054844425784217
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,6144,4096,0.0195448895295461
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,6144,2560,0.009653333160612319
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,6144,3584,0.01888088881969452
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,6144,3072,0.01789066692193349
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,6144,2048,0.00830844458606508
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,6144,1536,0.006940444310506185
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,6144,2560,0.016499555773205228
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,6144,2048,0.01514311134815216
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,6144,1024,0.006232000059551663
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,6144,768,0.004579555657174853
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,6144,1536,0.016093333562215168
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,6144,512,0.0041955556306574075
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,6144,16384,0.04285155402289497
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,6144,1024,0.0141004439857271
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,6144,256,0.0035084444615576
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,6144,768,0.013815999858909182
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,6144,128,0.003220444545149803
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,6144,64,0.0028595555987623003
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,6144,512,0.012785777449607849
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,6144,32,0.0032186667538351486
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,6144,256,0.012416889270146688
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,6144,128,0.011865778101815118
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,6144,64,0.011697777443461947
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,5120,65536,0.11024444633060032
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,6144,32,0.011713777979214987
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,5120,51200,0.08812355332904392
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,5120,16384,0.03465777635574341
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,5120,12288,0.028927998410330877
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,5120,65536,0.1458479960759481
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,6144,8192,0.02751111156410641
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,5120,10240,0.02535377773973677
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,5120,51200,0.11470845010545518
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,5120,16384,0.045496000183953174
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,5120,8192,0.022666666242811415
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,5120,7168,0.020267556111017864
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,5120,12288,0.03434755404790243
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,5120,6144,0.014482667048772177
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,5120,5120,0.013103110922707452
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,5120,8192,0.02675466736157735
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,5120,4096,0.011720889144473605
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,5120,7168,0.024381332927280005
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,5120,3584,0.010079999764760336
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,5120,6144,0.022808000445365906
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,5120,3072,0.010665777656767102
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,5120,5120,0.020786666207843356
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,5120,2560,0.009491555392742157
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,5120,4096,0.019440000255902607
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,5120,2048,0.008260444634490544
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,5120,3584,0.018541332748201158
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,5120,1536,0.006948444578382704
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,5120,1024,0.005250666704442766
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,5120,3072,0.016719111137919955
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,5120,2560,0.015875554747051664
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,5120,768,0.004882666799757215
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,5120,2048,0.014782221780882942
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,5120,512,0.004576888763242298
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,5120,1536,0.014651555154058667
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,5120,256,0.0038008888562520346
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,5120,1024,0.013758222262064615
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,5120,128,0.003173333282272021
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,5120,64,0.0028133332315418455
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,5120,768,0.013824000126785703
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,5120,512,0.013088000317414602
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,5120,32,0.002867555452717675
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,5120,256,0.011974222130245633
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,5120,128,0.011535111400816174
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,5120,64,0.011686222420798408
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,4096,65536,0.08909244669808282
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,5120,32,0.012098666694429187
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,4096,51200,0.07255822420120239
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,4096,16384,0.031094223260879517
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,4096,65536,0.10469510820176865
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,4096,12288,0.024829333027203877
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,96,128,128,0.01824711097611321
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,4096,51200,0.082805335521698
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,4096,10240,0.021852445271280076
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,4096,16384,0.03336355421278212
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,4096,8192,0.016122667325867545
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,4096,12288,0.025729777084456548
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,4096,10240,0.02330400049686432
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,4096,6144,0.012759110993809171
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,4096,5120,0.011380444798204633
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,4096,7168,0.019882667395803664
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,5120,10240,0.03044355577892727
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,4096,4096,0.010037333601050908
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,4096,6144,0.01903555625014835
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,4096,3584,0.009017777939637503
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,4096,5120,0.017551110850440133
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,4096,3072,0.008636444807052612
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,4096,2560,0.007596444752481248
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,4096,3584,0.015793777174419828
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,4096,3072,0.014888000157144336
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,4096,2560,0.014103111293580798
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,4096,1536,0.005495999836259418
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,4096,2048,0.013458666702111563
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,4096,1024,0.004528000122971005
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,4096,1536,0.01408622165520986
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,4096,768,0.0038888889054457345
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,4096,1024,0.01293955577744378
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,4096,512,0.0038382220599386427
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,4096,768,0.012791111237472959
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,4096,256,0.0032844444115956626
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,4096,512,0.012479110724396177
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,4096,128,0.0032133333798911837
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,4096,7168,0.01440533333354526
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,4096,256,0.011699555648697747
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,4096,64,0.0031759999692440033
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,4096,32,0.002987555538614591
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,4096,8192,0.02176800039079454
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,4096,128,0.011036444041464063
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,4096,64,0.011426666544543372
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,3584,65536,0.07885155412885878
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,4096,32,0.011372444530328115
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,3584,51200,0.06367733081181844
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,3584,16384,0.028868443436092798
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,3584,65536,0.10242044263415867
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,4096,4096,0.016568889220555622
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,3584,12288,0.02330133318901062
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,3584,10240,0.02034311162100898
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,4096,2048,0.006606222026877933
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,3584,51200,0.0809804466035631
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,3584,8192,0.017644445101420086
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,3584,7168,0.013609777722093793
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,3584,12288,0.02498311135503981
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,3584,16384,0.031975110371907554
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,3584,6144,0.012078222301271228
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,3584,5120,0.01071733319097095
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,3584,8192,0.021239999267790053
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,3584,4096,0.009974222216341231
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,3584,7168,0.019679110911157396
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,3584,3584,0.008744888835483128
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,3584,6144,0.018235555953449674
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,3584,3072,0.007948444121413762
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,3584,2560,0.007177777588367462
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,3584,4096,0.015470221638679504
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,3584,2048,0.005943111247486538
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,3584,3584,0.015487111277050443
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,3584,3072,0.014249778456158109
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,3584,1536,0.004923555586073133
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,3584,2560,0.013983110586802164
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,3584,2048,0.01313511116637124
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,3584,768,0.003882666842805015
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,3584,1024,0.012741333080662621
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,3584,512,0.0038453332251972626
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,3584,768,0.01276000009642707
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,3584,256,0.0032239999208185407
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,3584,512,0.01239999963177575
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,3584,128,0.0032071111102898917
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,3584,256,0.011720889144473605
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,3584,64,0.002999111182159848
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,3584,128,0.011368888947698804
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,3584,32,0.0031475555151700974
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,3584,64,0.011607111328177981
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,3584,10240,0.023016888234350417
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,3072,65536,0.0698195563422309
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,3584,32,0.011047999891969891
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,3072,51200,0.055493334929148354
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,3072,16384,0.023749333288934495
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,3584,5120,0.017166222135225933
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,3072,65536,0.09996710883246528
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,3072,12288,0.01977244516213735
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,3072,51200,0.07894311348597209
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,3072,10240,0.017208000024159748
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,3072,16384,0.03117155697610643
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,3072,8192,0.015303999185562134
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,3072,7168,0.013066666821638743
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,3072,12288,0.024671999944580927
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,3072,10240,0.022337777747048274
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,3072,6144,0.012378666963842181
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,3072,8192,0.020611556039916146
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,3584,1536,0.013789333403110504
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,3072,4096,0.009668444593747457
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,3072,6144,0.018201778332392376
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,3072,3584,0.008607111043400234
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,3072,5120,0.016600888636377122
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,3072,3072,0.008264000217119852
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,3072,4096,0.01483022173245748
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,3072,2560,0.007486222518814935
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,3072,3584,0.015127110812399121
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,3072,2048,0.006550222221348021
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,3072,3072,0.014102222190962898
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,3072,1536,0.0052684446175893145
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,3072,2560,0.013839999834696451
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,3072,1024,0.004559999952713649
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,3072,2048,0.013386666774749756
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,3072,768,0.003960888832807541
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,3072,1536,0.01348355578051673
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,3072,512,0.0035573335157500375
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,3072,1024,0.012434666355450949
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,3072,256,0.0034764446318149567
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,3072,768,0.0127688886390792
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,3072,128,0.003162666741344664
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,3072,512,0.012182222472296821
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,3072,64,0.0028293333533737394
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,3072,256,0.011740444435013665
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,3072,128,0.011704000333944956
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,3072,64,0.011762667033407422
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,3584,1024,0.0042168887125121225
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,3072,32,0.011388444238238864
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,3072,5120,0.011007111105653973
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,2560,51200,0.05327999922964308
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,3072,7168,0.0192248887485928
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,2560,16384,0.02149066660139296
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,2560,65536,0.09660622146394517
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,2560,12288,0.017882666654056974
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,2560,51200,0.07656000057856242
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,2560,10240,0.015798222687509324
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,2560,16384,0.030105776256985132
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,2560,8192,0.013975110318925647
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,2560,12288,0.02420799930890401
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,2560,7168,0.013087111214796701
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,2560,10240,0.022129777404997084
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,2560,8192,0.020236444142129686
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,2560,5120,0.010019555687904358
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,2560,7168,0.018553778529167175
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,2560,4096,0.009304000271691216
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,2560,6144,0.017982222967677645
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,2560,3584,0.008328888979223039
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,2560,3072,0.007600000335110559
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,2560,5120,0.01648355523745219
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,2560,4096,0.014821334017647637
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,2560,3584,0.01480977733929952
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,2560,2048,0.0057546666098965546
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,2560,3072,0.014117333624098035
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,2560,1536,0.004875555634498596
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,2560,2560,0.013752889302041797
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,2560,1024,0.004231111043029361
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,2560,2048,0.013429332938459186
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,2560,768,0.003879111260175705
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,2560,1536,0.013080889152155982
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,3072,32,0.0028320000403457214
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,2560,512,0.0035182221068276297
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,2560,1024,0.0124195557501581
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,2560,256,0.0031617778456873367
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,2560,128,0.0028693332440323303
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,2560,768,0.01277599980433782
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,2560,65536,0.0653031137254503
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,2560,512,0.012125333150227865
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,2560,64,0.002842666581273079
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,2560,256,0.011730666789743634
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,2560,128,0.01107911103301578
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,2048,65536,0.053471999035941235
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,2560,64,0.011437333292431302
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,2560,32,0.012084444363911947
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,2048,51200,0.04331377810902066
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,2048,16384,0.018744889232847426
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,2048,12288,0.01479644411140018
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,2048,65536,0.09337688816918267
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,2560,6144,0.011053333679835001
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,2048,51200,0.07476977507273357
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,2048,16384,0.029548443026012842
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,2048,12288,0.02403555479314592
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,2048,7168,0.011736888852384357
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,2048,10240,0.021958221991856892
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,2048,8192,0.019641778535313077
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,2048,6144,0.01090311093462838
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,2560,2560,0.006917333437336816
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,2048,5120,0.010021333065297868
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,2048,4096,0.008606221940782335
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,2048,7168,0.018578666779730055
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,2048,3584,0.007680888805124495
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,2048,5120,0.015796444482273526
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,2048,3072,0.006748444504208035
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,2048,3584,0.014517333772447375
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,2048,2560,0.006280000011126201
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,2048,3072,0.014113777213626437
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,2048,2048,0.0052284445199701525
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,2560,32,0.0028248888750871024
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,2048,2048,0.013420444395807056
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,2048,1536,0.004880889008442561
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,2048,1536,0.013413333230548434
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,2048,1024,0.0041866666740841335
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,2048,10240,0.014174222946166992
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,2048,768,0.0038328886859946777
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,2048,8192,0.01329422245422999
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,2048,512,0.003510222252872255
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,2048,768,0.012442666623327466
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,2048,256,0.0032026666320032547
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,2048,512,0.012402666939629449
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,2048,128,0.0031475555151700974
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,2048,6144,0.016297777493794758
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,2048,64,0.0028133332315418455
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,2048,4096,0.014856000741322836
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,2048,32,0.0028799999919202593
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,2048,128,0.011426666544543372
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,2048,64,0.01074222226937612
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,1536,65536,0.04172977805137634
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,2048,32,0.01110311100880305
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,1536,51200,0.033462223079469465
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,1536,16384,0.015064888530307345
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,2048,2560,0.013785777820481194
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,1536,65536,0.09010399712456597
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,1536,12288,0.014512888259357877
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,1536,51200,0.07249866591559516
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,1536,10240,0.013136000268989138
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,1536,16384,0.029121776421864826
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,1536,8192,0.012112889024946423
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,1536,7168,0.011392888923486074
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,1536,12288,0.023345778385798138
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,1536,6144,0.010936000280910067
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,1536,10240,0.021537777450349595
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,1536,8192,0.018920888503392536
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,1536,5120,0.009711110757456886
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,1536,7168,0.01755644381046295
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,1536,4096,0.00905600024594201
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,1536,3584,0.007273777491516537
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,2048,1024,0.012520000338554382
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,1536,5120,0.015636444091796875
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,1536,3072,0.006575999988449945
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,1536,4096,0.014821334017647637
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,1536,2560,0.005899555567238066
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,1536,3584,0.014490667316648694
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,1536,2048,0.005251555393139522
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,1536,1536,0.004875555634498596
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,1536,3072,0.013815999858909182
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,1536,1024,0.00387999994887246
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,1536,2560,0.01368444412946701
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,1536,2048,0.012796444197495779
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,2048,256,0.011758222348160215
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,1536,1536,0.013344888885815939
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,1536,512,0.0035706667436493766
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,1536,256,0.0031591111587153543
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,1536,768,0.01240711079703437
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,1536,128,0.0028817777832349143
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,1536,512,0.012411555482281579
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,1536,64,0.0028159999185138275
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,1536,256,0.011724444727102915
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,1536,32,0.0028159999185138275
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,1536,128,0.011369778050316704
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,1536,64,0.011719110939237805
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,1024,65536,0.03075466553370158
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,1536,32,0.011152000062995486
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,1024,51200,0.024901333782407973
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,1024,16384,0.012903999951150684
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,1024,65536,0.08734489149517483
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,1024,51200,0.06891466511620416
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,1024,12288,0.010669333239396414
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,1024,16384,0.02878311276435852
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,1024,10240,0.011226666470368704
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,1536,6144,0.016182222300105624
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,1024,8192,0.012473777764373355
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,1024,7168,0.01239466667175293
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,1024,12288,0.02241955531968011
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,1024,10240,0.020933333370420668
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,1024,6144,0.01108444482088089
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,1024,8192,0.018232888645595975
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,1024,5120,0.009955555200576782
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,1024,7168,0.017518222332000732
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,1024,6144,0.016189333465364244
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,1024,5120,0.015164444843928019
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,1536,768,0.003859555555714501
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,1024,3584,0.0069155556460221606
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,1024,3072,0.0063680000603199005
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,1024,2560,0.005892444401979446
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,1536,1024,0.012453333371215396
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,1024,2048,0.006355555521117316
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,1024,1536,0.005600888695981767
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,1024,3584,0.014189332723617554
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,1024,3072,0.013810666898886362
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,1024,1024,0.004552888787455029
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,1024,2560,0.013783999615245394
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,1024,768,0.0038951109680864546
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,1024,2048,0.013067555924256643
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,1024,512,0.0035342222286595237
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,1024,1536,0.012791111237472959
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,1024,256,0.003192000091075897
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,1024,128,0.002883555574549569
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,1024,1024,0.012103111379676394
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,1024,768,0.012661333713266583
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,1024,512,0.012094222009181976
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,1024,64,0.0028444443725877335
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,1024,256,0.011360000405046674
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,1024,32,0.002842666581273079
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,1024,128,0.011052444577217102
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,768,65536,0.02610933283964793
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,1024,64,0.011415111521879831
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,768,51200,0.021555556191338435
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,1024,32,0.011029333704047732
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,768,16384,0.011731555892361535
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,768,12288,0.010015111002657149
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,768,65536,0.08510400189293756
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,768,10240,0.009927111367384592
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,768,51200,0.06675377819273207
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,768,16384,0.027922666735119287
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,768,8192,0.010672888822025724
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,768,12288,0.022335999541812476
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,768,7168,0.009654222263230218
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,768,6144,0.008302222523424361
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,768,10240,0.01995377739270528
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,768,8192,0.018200889229774475
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,768,5120,0.00885688927438524
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,1024,4096,0.008958222137557136
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,768,4096,0.007641777396202087
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,768,7168,0.01755199995305803
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,768,3584,0.007076444725195567
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,768,6144,0.016494222813182406
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,768,3072,0.00628355559375551
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,768,2560,0.005889777921968036
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,1024,4096,0.014787554740905762
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,768,2048,0.005223111146026188
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,768,3584,0.014521777629852295
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,768,1536,0.0046942221621672315
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,768,2560,0.013433777623706393
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,768,1024,0.00388711111413108
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,768,2048,0.013139555851618448
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,768,768,0.003830222205983268
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,768,1536,0.013157332936922709
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,768,512,0.003528888854715559
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,768,1024,0.012074666718641916
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,768,256,0.003195555466744635
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,768,768,0.01239733315176434
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,768,128,0.0028808888875775864
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,768,512,0.012431110772821637
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,768,64,0.002558222247494592
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,768,256,0.011513777905040316
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,768,32,0.002797333316670524
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,768,128,0.011725333001878528
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,512,65536,0.022506665852334764
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,768,64,0.011746666497654386
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,768,32,0.011078221930397881
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,512,51200,0.018153778380817838
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,512,16384,0.013089777694808112
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,512,65536,0.0827253328429328
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,512,51200,0.06439644760555692
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,512,12288,0.010749333434634738
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,512,16384,0.02643022272321913
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,512,10240,0.010382222632567087
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,512,8192,0.009649777577983009
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,768,4096,0.014442667365074158
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,512,12288,0.02164622147878011
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,512,7168,0.008975110948085785
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,512,10240,0.020263999700546265
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,512,6144,0.007839110990365347
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,512,8192,0.018242667118708294
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,512,5120,0.00795199970404307
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,512,4096,0.0076044441925154785
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,512,7168,0.01686311099264357
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,512,3584,0.006956444846259222
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,512,6144,0.016340444485346477
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,512,5120,0.015523556205961438
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,512,3072,0.006416888700591193
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,512,4096,0.01443733274936676
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,512,3584,0.014576888746685453
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,512,2048,0.005264889034960005
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,512,2560,0.01346666696998808
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,512,1536,0.00453955555955569
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,512,2048,0.012808000048001608
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,512,1024,0.0038746665749284956
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,512,1536,0.01274577776590983
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,512,768,0.003847111016511917
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,512,1024,0.0120666664507654
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,512,512,0.0031831111345026228
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,512,768,0.01221244451072481
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,512,256,0.0031715554909573663
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,512,512,0.012096000214417776
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,512,128,0.00282577777074443
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,768,5120,0.015400888191329109
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,512,64,0.002532444480392668
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,512,256,0.01145600030819575
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,768,3072,0.013807999591032663
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,512,32,0.0028417776856157514
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,512,128,0.010739555789364709
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,256,65536,0.019270223047998216
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,512,64,0.011406222151385413
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,256,51200,0.016864889197879367
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,256,16384,0.009885333478450775
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,256,65536,0.07882755332522921
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,512,2560,0.005557333429654439
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,256,51200,0.06317066484027438
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,256,12288,0.010033778018421596
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,256,10240,0.009152889251708984
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,256,16384,0.026047999660174053
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,512,3072,0.014130666851997375
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,256,8192,0.008616888688670265
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,256,7168,0.008253333469231924
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,256,12288,0.021644444929228887
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,256,10240,0.01971733404530419
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,256,8192,0.018391110830836825
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,256,5120,0.008027555214034187
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,256,7168,0.016813332835833233
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,256,4096,0.007311999797821045
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,256,3584,0.0069217777086628815
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,256,5120,0.015512888630231222
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,256,3072,0.006280000011126201
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,256,3584,0.01408622165520986
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,256,2560,0.0057884446448749965
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,256,3072,0.014138667119873894
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,256,2048,0.005000000198682149
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,256,2560,0.013462222284740873
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,256,1536,0.004548444516128964
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,256,2048,0.013458666702111563
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,256,1024,0.0038782221575578055
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,512,32,0.011423110961914062
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,256,1536,0.012552888856993781
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,256,768,0.003568888952334722
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,256,512,0.0035342222286595237
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,256,1024,0.012400888734393649
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,256,256,0.0028391112056043413
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,256,768,0.012117333710193634
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,256,512,0.012055111428101858
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,256,128,0.0028444443725877335
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,256,64,0.002542222125662698
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,256,6144,0.00867377801073922
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,256,256,0.011742221812407175
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,256,32,0.0028213332924577924
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,256,128,0.011419555379284753
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,128,65536,0.015098666151364645
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,256,64,0.010680889089902243
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,128,51200,0.014818666709793938
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,256,6144,0.015947555502255756
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,256,32,0.011739555332395764
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,128,16384,0.009364444348547194
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,128,12288,0.009740444521109263
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,128,10240,0.009024000002278222
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,128,65536,0.07764355341593425
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,128,8192,0.00796622203456031
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,256,4096,0.014108444253603617
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,128,51200,0.061230222384134926
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,128,16384,0.02606222199069129
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,128,7168,0.00903911143541336
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,128,12288,0.021611554755104914
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,128,6144,0.008356444537639618
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,128,10240,0.02017866737312741
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,128,5120,0.00796088907453749
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,128,4096,0.007266666326257918
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,128,3584,0.007048000064161088
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,128,8192,0.017903111047214933
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,128,3072,0.006636444479227066
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,128,7168,0.016561778055297006
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,128,5120,0.015121777852376303
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,128,4096,0.014811555544535318
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,128,2048,0.004920888692140579
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,128,3584,0.014118222726715935
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,128,1536,0.004250666747490565
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,128,3072,0.013812444276279874
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,128,1024,0.003855111284388436
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,128,2560,0.01313866674900055
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,128,768,0.0035617777870761026
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,128,2048,0.013470222552617392
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,128,512,0.003334222154484855
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,128,1536,0.012516444755925072
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,128,256,0.0028640000770489373
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,128,1024,0.012167111039161682
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,128,128,0.002562666725781229
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,128,64,0.002519999941190084
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,128,512,0.011821333732869891
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,128,256,0.011371555427710215
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,128,32,0.00282222218811512
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,128,128,0.011392888923486074
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,64,65536,0.01648622254530589
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,128,64,0.011759111450778114
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,64,51200,0.014840000205569796
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,64,16384,0.009327111144860586
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,64,65536,0.07659644550747342
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,64,51200,0.059345775180392794
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,64,12288,0.009645333720578088
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,64,16384,0.02609599961174859
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,64,10240,0.008953777452309927
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,64,8192,0.00815644446346495
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,64,12288,0.021800888909233943
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,64,7168,0.007653333246707916
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,64,10240,0.01961955593691932
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,64,8192,0.017872888180944655
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,64,6144,0.006981333096822103
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,64,5120,0.006621333460013072
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,128,6144,0.015676443775494892
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,64,7168,0.01720266706413693
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,128,2560,0.005562666803598404
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,64,4096,0.00628977765639623
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,64,6144,0.016172443826993305
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,64,3584,0.005964444329341252
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,64,3072,0.0064106666379504735
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,64,4096,0.014835556348164877
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,64,2560,0.006257777826653586
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,64,3072,0.013434666726324292
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,128,768,0.01205599970287747
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,64,2048,0.005577777822812398
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,64,1536,0.0041928887367248535
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,64,2560,0.013458666702111563
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,64,1024,0.0038702223036024305
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,64,2048,0.012543111211723752
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,64,1536,0.01272266689274046
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,64,768,0.0035173334181308746
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,128,32,0.010776888993051318
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,64,768,0.012104888757069906
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,64,256,0.0026444445053736367
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,64,512,0.011749332977665795
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,64,128,0.00281866660548581
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,64,256,0.011183111204041375
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,64,64,0.002471999989615546
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,64,128,0.010377777947319878
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,64,32,0.0024746666765875286
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,64,64,0.010363555616802638
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,32,65536,0.016167110866970487
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,64,32,0.010685332947307162
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,64,5120,0.014836443795098199
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,32,51200,0.015170666906568738
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,32,16384,0.009329777624871995
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,64,3584,0.014317333698272705
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,32,65536,0.07523022095362346
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,32,12288,0.009296000003814697
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,32,51200,0.05922044648064507
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,32,10240,0.008919110728634728
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,32,16384,0.02586666742960612
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,32,8192,0.007928888830873702
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,32,7168,0.007304888632562425
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,32,10240,0.019682667321628995
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,32,8192,0.017623111605644226
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,32,6144,0.0069351109365622205
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,32,5120,0.006641777853171031
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,32,7168,0.016878222425778706
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,64,512,0.003168888803985384
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,64,1024,0.012425777812798819
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,32,4096,0.006280888699822956
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,32,3584,0.006311111152172089
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,32,3072,0.006613333192136552
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,32,6144,0.015806222955385845
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,32,2560,0.006245333287451003
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,32,4096,0.014164444473054675
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,32,3584,0.014426666829321118
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,32,2048,0.005879111174080107
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,32,3072,0.014095111025704278
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,32,2560,0.013408888545301227
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,32,2048,0.013082666529549493
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,32,1536,0.013106666505336761
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,32,768,0.003569777641031477
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,32,1024,0.0121742222044203
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,32,512,0.003152888889114062
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,32,768,0.01275199982855055
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,32,256,0.0028657778683635923
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,32,512,0.0120319997270902
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,32,128,0.0027911110470692315
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,32,256,0.011733333269755045
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,32,64,0.00249777775671747
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,32,128,0.011379555695586734
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,32,12288,0.021369778447681006
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,32,32,0.0028088889602157804
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,32,64,0.011423110961914062
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,32,32,0.010690666735172272
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,81,32,5120,0.01482399966981676
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,32,1536,0.0041946665280395085
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,81,32,1024,0.0038524443904558816
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,65536,16384,0.36019288169013125
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,65536,16384,0.21571200423770479
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,65536,51200,0.6330240037706163
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,65536,12288,0.27081865734524196
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,65536,12288,0.15957155492570665
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,65536,51200,1.1164977815416124
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,65536,10240,0.218596445189582
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,65536,10240,0.1361502276526557
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,65536,8192,0.11668799983130561
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,65536,8192,0.1760880019929674
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,65536,7168,0.1537875599331326
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,65536,7168,0.09950400061077541
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,65536,12288,0.226090669631958
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,65536,6144,0.13140800264146593
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,65536,16384,0.29754577742682564
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,65536,10240,0.19225688775380453
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,65536,8192,0.157094226943122
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,65536,6144,0.08781066868040298
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,65536,5120,0.11385511027442084
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,65536,4096,0.09342666467030843
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,65536,5120,0.07494933075375028
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,65536,7168,0.14080444971720377
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,65536,3584,0.0788773364490933
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,65536,4096,0.0630213353368971
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,65536,3072,0.06995111041598849
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,65536,3584,0.05749422311782837
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,65536,3072,0.05110044280687968
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,65536,6144,0.1248213317659166
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,65536,4096,0.09344889058007134
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,65536,5120,0.11032266749276055
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,65536,3584,0.08560799890094334
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,65536,2560,0.045520888434516064
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,65536,2048,0.04815999997986687
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,65536,3072,0.07958488994174533
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,65536,2048,0.04014666544066535
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,65536,2560,0.07023021909925672
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,65536,1536,0.043940444787343345
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,65536,1024,0.02829422222243415
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,65536,1536,0.062096887164645724
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,65536,1024,0.031446221801969744
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,65536,768,0.021485333641370136
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,65536,768,0.025419554776615564
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,65536,512,0.01443555619981554
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,65536,768,0.04397066765361362
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,65536,512,0.038430223862330117
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,65536,512,0.022486221459176805
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,65536,256,0.009301332963837517
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,65536,2560,0.05958933300442166
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,65536,128,0.007797333101431529
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,65536,256,0.01925155520439148
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,65536,256,0.03389422098795573
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,65536,64,0.006638222270541721
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,65536,1536,0.03756533397568597
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,65536,128,0.028528001573350694
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,65536,32,0.006583111153708563
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,65536,64,0.01755644381046295
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,65536,32,0.022261333134439256
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,65536,2048,0.06372088856167264
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,65536,1024,0.05197599861356947
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,51200,65536,0.6602977646721734
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,51200,51200,0.5051164627075195
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,51200,51200,0.8552293247646756
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,51200,65536,1.0841333601209853
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,65536,128,0.017512000269360013
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,51200,16384,0.27545155419243705
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,65536,51200,0.9045599831475152
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,51200,12288,0.2083973354763455
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,51200,16384,0.17330311404334175
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,51200,10240,0.17416532834370932
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,51200,12288,0.12840622001224095
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,51200,8192,0.14152533478207058
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,51200,10240,0.11039288838704427
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,51200,8192,0.09460977713267009
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,51200,7168,0.12514489226871067
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,51200,8192,0.13626133071051702
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,51200,16384,0.24836977322896323
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,51200,10240,0.16296088695526123
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,51200,7168,0.081423110432095
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,51200,6144,0.10752266645431519
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,51200,6144,0.0722115569644504
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,51200,5120,0.09146310885747273
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,51200,5120,0.061908443768819175
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,51200,4096,0.07445422146055433
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,51200,7168,0.12258399857415093
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,51200,6144,0.10969866646660699
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,51200,3584,0.06610400146908231
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,51200,5120,0.09626577960120307
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,51200,3584,0.04784799946679009
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,51200,4096,0.08417955372068618
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,51200,3072,0.05800177653630575
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,51200,12288,0.1922311120563083
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,51200,3584,0.0764897796842787
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,51200,3072,0.04312088754442003
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,51200,2560,0.04853511187765333
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,51200,2048,0.03968088825543722
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,51200,3072,0.06988977723651461
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,51200,2560,0.03902755512131585
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,51200,1536,0.031587554348839655
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,51200,2560,0.06401155392328899
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,51200,2048,0.03480888737572564
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,51200,1024,0.02330222229162852
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,51200,2048,0.05692088603973389
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,51200,1536,0.051220443513658315
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,51200,768,0.017151110702090792
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,51200,1024,0.026550221774313185
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,51200,1024,0.04733599887953865
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,51200,512,0.012352888782819113
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,51200,4096,0.05292000042067634
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,51200,768,0.039579557047949895
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,51200,256,0.008279110822412703
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,51200,512,0.035904000202814736
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,51200,128,0.0058906666106647914
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,51200,512,0.020933333370420668
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,51200,768,0.022666666242811415
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,51200,256,0.017144888639450073
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,51200,64,0.00453599997692638
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,51200,32,0.004859555512666702
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,51200,128,0.026708443959554035
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,51200,128,0.015824889143308003
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,51200,64,0.01614755557643043
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,51200,32,0.01904977858066559
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,16384,65536,0.3264053397708469
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,51200,51200,0.7550729115804037
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,16384,65536,0.26160621643066406
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,16384,51200,0.25032711029052734
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,16384,16384,0.0823999974462721
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,51200,1536,0.03616266780429416
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,16384,51200,0.2024737728966607
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,16384,16384,0.07534044318728976
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,16384,12288,0.06538489129808214
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,16384,12288,0.05648089117474026
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,51200,65536,0.9861937628851997
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,16384,10240,0.05412266651789347
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,51200,256,0.03081866767671373
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,16384,8192,0.04626133375697666
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,16384,16384,0.08365955617692734
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,16384,12288,0.06679022312164307
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,16384,10240,0.051832887861463756
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,16384,7168,0.03945599993069967
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,16384,10240,0.059345775180392794
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,16384,8192,0.04353333181805081
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,16384,6144,0.034330666065216064
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,16384,7168,0.03949955436918471
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,16384,8192,0.05355111095640394
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,16384,6144,0.03480622172355652
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,16384,5120,0.029792000850041706
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,16384,7168,0.048842665221956044
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,16384,4096,0.026055110825432673
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,16384,6144,0.046282665597067944
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,16384,5120,0.03115733464558919
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,16384,3584,0.021869333253966436
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,16384,4096,0.027460444304678176
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,16384,5120,0.042308443122439914
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,16384,4096,0.03861066699028015
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,16384,3072,0.019256000717480976
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,16384,3584,0.02569777766863505
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,16384,51200,0.2001671128802829
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,16384,3584,0.0359555549091763
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,16384,65536,0.2522328959570991
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,16384,2048,0.013401777380042605
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,16384,3072,0.03613244493802389
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,16384,1536,0.010762666662534079
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,16384,2560,0.0326275560590956
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,16384,2048,0.031048887305789526
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,16384,2048,0.01960355540116628
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,16384,1024,0.008651555412345463
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,16384,1536,0.0203128887547387
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,16384,1536,0.03018488817744785
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,16384,768,0.007300444775157505
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,16384,1024,0.02815377712249756
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,16384,1024,0.016530666086408827
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,16384,512,0.00572533326016532
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,16384,768,0.02612177696492937
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,16384,768,0.015561777684423657
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,16384,256,0.003882666842805015
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,16384,512,0.014508444401952954
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,16384,128,0.003616888903909259
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,16384,256,0.012778666284349231
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,16384,256,0.022636445032225713
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,16384,64,0.003540444291300244
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,16384,128,0.012442666623327466
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,16384,128,0.019559999306996662
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,16384,32,0.003547555456558863
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,16384,64,0.013438222308953604
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,16384,32,0.013764444324705334
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,16384,2560,0.01642933322323693
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,12288,65536,0.25000090069240993
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,16384,3072,0.023040889037979975
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,12288,65536,0.2106391059027778
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,16384,2560,0.021143111917707656
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,12288,16384,0.07103200091256036
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,12288,51200,0.19838399357265898
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,12288,12288,0.055247111452950366
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,12288,51200,0.16259911325242785
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,12288,16384,0.06259822183185153
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,12288,10240,0.04620711008707682
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,12288,12288,0.04707733458942837
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,16384,512,0.023024888502226934
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,12288,16384,0.07620977693133883
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,12288,12288,0.061531556977166064
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,12288,8192,0.038896001047558255
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,12288,7168,0.033977776765823364
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,12288,8192,0.03685599896642897
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,12288,10240,0.05501866671774122
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,12288,8192,0.049421333604388766
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,12288,7168,0.045787556303872
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,12288,6144,0.029792000850041706
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,12288,5120,0.025785777303907607
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,12288,51200,0.1774266693327162
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,12288,6144,0.04334400097529093
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,12288,4096,0.022184888521830242
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,12288,5120,0.026307556364271376
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,12288,65536,0.22258665826585558
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,12288,5120,0.038889778984917536
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,12288,3584,0.019090667366981506
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,12288,4096,0.023296000228987798
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,12288,4096,0.03645066751374139
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,12288,3072,0.016697777642144095
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,12288,3584,0.02184533410602146
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,12288,3584,0.03417244553565979
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,12288,2560,0.014078223043017916
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,12288,3072,0.020571556356218126
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,12288,3072,0.03442222211096022
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,12288,10240,0.041498667663998075
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,12288,2048,0.012315555579132505
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,12288,1536,0.01036444471942054
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,12288,2560,0.03252089023590088
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,12288,2560,0.019159111711714003
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,12288,2048,0.01826400061448415
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,12288,1024,0.008542222281297049
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,12288,1536,0.029010666741265193
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,12288,1536,0.01796533332930671
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,12288,6144,0.029558221499125164
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,12288,768,0.0069253332912921906
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,12288,1024,0.02758666707409753
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,12288,1024,0.015847111741701763
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,12288,768,0.02569955587387085
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,12288,768,0.0144533332851198
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,12288,256,0.0038515557017591265
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,12288,512,0.013774221969975365
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,12288,512,0.02332088847955068
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,12288,128,0.0035084444615576
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,12288,256,0.022364444202846948
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,12288,256,0.012740444805887012
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,12288,64,0.0032088889016045462
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,12288,128,0.012063999970753988
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,12288,128,0.020389333367347717
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,12288,32,0.003519999898142285
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,12288,64,0.012734221915404001
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,12288,32,0.014087999860445658
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,10240,65536,0.2174746725294325
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,10240,65536,0.201401776737637
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,12288,2048,0.030817776918411255
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,10240,51200,0.17064978016747367
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,10240,16384,0.05676533116234673
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,12288,7168,0.0326257778538598
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,10240,51200,0.1569653352101644
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,10240,12288,0.043692443105909556
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,12288,512,0.005212444398138259
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,10240,10240,0.03751733236842685
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,10240,16384,0.05970578061209785
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,10240,12288,0.04528444343143039
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,10240,16384,0.07277244329452515
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,10240,8192,0.031537777847713895
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,10240,12288,0.05951733059353299
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,10240,10240,0.04036533170276218
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,10240,7168,0.02782577938503689
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,10240,8192,0.03541600041919284
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,10240,10240,0.053525331947538585
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,10240,7168,0.03194133440653483
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,10240,6144,0.02456533412138621
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,10240,8192,0.048567109637790255
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,10240,5120,0.021739555729760066
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,10240,7168,0.044128888183169894
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,10240,4096,0.017828444639841717
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,10240,6144,0.028079112370808918
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,10240,65536,0.21336889266967773
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,10240,6144,0.04247644543647766
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,10240,3584,0.01643822259373135
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,10240,51200,0.17083466053009033
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,10240,5120,0.03860444492763943
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,10240,3072,0.01460800071557363
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,10240,4096,0.022456000248591106
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,10240,4096,0.03587199913130866
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,10240,2560,0.012696888711717395
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,10240,3584,0.021560889151361253
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,10240,3584,0.03489155570665995
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,10240,2048,0.011490667031870948
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,10240,3072,0.020202666521072388
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,10240,3072,0.03315733207596673
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,10240,2560,0.01902755598227183
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,10240,2560,0.03147644466824002
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,10240,1536,0.009336888790130615
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,10240,1024,0.007932444413503012
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,10240,2048,0.01789155602455139
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,10240,1536,0.029410666889614526
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,10240,1536,0.017450667089886136
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,10240,768,0.006600889066855113
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,10240,1024,0.014434667097197639
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,10240,512,0.005231110999981563
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,10240,1024,0.024711999628278945
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,10240,256,0.004182222402758068
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,10240,768,0.02467022173934513
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,10240,768,0.013889777991506787
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,10240,512,0.024381332927280005
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,10240,512,0.013090666797426013
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,10240,128,0.0038515557017591265
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,10240,64,0.0034933334423436057
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,10240,256,0.0226239992512597
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,10240,32,0.0034773333205117118
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,10240,128,0.01902577777703603
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,10240,128,0.012605333493815528
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,10240,64,0.011755555868148804
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,10240,32,0.013117333253224691
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,8192,65536,0.1730142169528537
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,8192,65536,0.1577191087934706
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,10240,5120,0.025568000144428674
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,8192,51200,0.13447288672129312
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,8192,16384,0.04747200012207031
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,8192,51200,0.12198132938808864
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,8192,12288,0.03772888912094964
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,8192,16384,0.04901777704556783
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,8192,16384,0.06804977522956
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,8192,12288,0.03734133309788174
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,8192,10240,0.0314684444003635
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,8192,12288,0.05681688918007744
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,8192,10240,0.03359199894799127
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,8192,8192,0.026875555515289307
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,8192,10240,0.051073776351081006
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,10240,256,0.01236977759334776
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,8192,51200,0.15719555483924016
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,8192,65536,0.1960808833440145
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,8192,8192,0.030029333300060693
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,8192,8192,0.04645511176851061
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,8192,6144,0.020603555772039626
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,8192,7168,0.02619022296534644
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,8192,7168,0.042711999681260854
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,8192,5120,0.017749332719379
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,8192,6144,0.023991111252042983
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,8192,6144,0.04033333394262526
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,8192,4096,0.014832889040311178
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,8192,5120,0.038110223081376814
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,8192,3584,0.01316088851955202
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,8192,4096,0.03555644551912943
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,8192,4096,0.020272889071040683
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,8192,3072,0.012019555601808759
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,8192,3584,0.019340443942281935
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,8192,3584,0.033788445923063494
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,8192,2560,0.010657777388890585
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,10240,2048,0.03014755580160353
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,8192,3072,0.018094221750895183
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,8192,2048,0.009296889106432596
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,8192,3072,0.03322844372855292
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,8192,2560,0.030990223089853924
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,8192,2560,0.017272889614105225
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,8192,1536,0.007909333540333642
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,8192,2048,0.03090311090151469
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,8192,2048,0.016359999775886536
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,8192,1024,0.006238222122192383
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,8192,1536,0.015560888581805758
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,8192,1536,0.02665155629316966
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,8192,768,0.004885333279768626
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,8192,7168,0.023099554909600153
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,8192,1024,0.013739555246300168
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,8192,512,0.004210666649871402
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,8192,768,0.024695111645592585
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,8192,768,0.013404444687896304
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,8192,256,0.003559111307064692
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,8192,512,0.012738666600651212
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,8192,512,0.02299733294381036
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,8192,128,0.0032400000426504347
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,8192,256,0.02232711182700263
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,8192,256,0.012050666742854647
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,8192,64,0.0031635556370019913
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,8192,128,0.01887999971707662
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,8192,128,0.01145244472556644
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,8192,5120,0.02168088820245531
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,8192,64,0.012056888805495368
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,8192,32,0.012050666742854647
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,7168,65536,0.15182133515675864
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,7168,65536,0.15486755636003283
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,7168,16384,0.0474275549252828
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,7168,51200,0.12197421656714545
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,7168,16384,0.04748622245258755
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,7168,12288,0.034506665335761175
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,7168,16384,0.06775999731487699
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,8192,1024,0.025128000312381323
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,7168,10240,0.028740445772806805
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,7168,12288,0.036504000425338745
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,7168,51200,0.1553999980290731
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,7168,12288,0.055958224667443164
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,7168,65536,0.193101339870029
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,7168,8192,0.025034666061401367
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,7168,10240,0.0325564444065094
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,7168,7168,0.021686222818162706
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,7168,10240,0.050382223394181996
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,7168,6144,0.01886488828394148
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,7168,8192,0.02879555688963996
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,8192,32,0.0031439999325407874
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,7168,8192,0.04515377680460612
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,7168,7168,0.02566755480236477
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,7168,5120,0.016723554995324876
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,7168,7168,0.04214222232500712
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,7168,4096,0.014377777775128683
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,7168,6144,0.02342044479317135
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,7168,6144,0.040163556734720864
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,7168,3584,0.012709333664841123
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,7168,5120,0.02148977749877506
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,7168,4096,0.01979822251531813
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,7168,3072,0.011700444751315646
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,7168,3584,0.018817777434984844
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,7168,3584,0.033538666036393903
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,7168,2560,0.010117332968446944
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,7168,3072,0.03197244471973843
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,7168,3072,0.018202667435010273
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,7168,2048,0.008847999903890822
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,7168,2560,0.016864889197879367
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,7168,2560,0.030237333642111883
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,7168,1536,0.007621333003044128
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,7168,2048,0.015344889627562629
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,7168,2048,0.02921066681543986
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,7168,1024,0.005479111025730769
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,7168,1536,0.026766222384240892
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,7168,1536,0.015150222513410779
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,7168,768,0.004571555389298333
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,7168,1024,0.013815110756291283
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,7168,1024,0.02403822210099962
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,7168,512,0.0042151109211974675
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,7168,768,0.023994666006830003
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,7168,768,0.013110222087966071
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,7168,256,0.0035137778355015647
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,7168,512,0.012712889247470431
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,7168,512,0.022985777921146814
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,7168,128,0.003160888950030009
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,7168,256,0.012096888489193387
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,7168,256,0.020967110991477966
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,7168,64,0.0028231110837724474
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,7168,128,0.011527111132939657
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,7168,128,0.018533334136009216
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,7168,32,0.0028355556229750314
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,7168,5120,0.03804888990190294
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,7168,64,0.011413333316644033
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,7168,51200,0.12062488661872016
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,7168,32,0.011724444727102915
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,6144,65536,0.1255413293838501
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,6144,51200,0.10149688853157891
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,6144,65536,0.14800000190734863
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,6144,51200,0.11591022544436985
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,6144,16384,0.040820442967944674
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,6144,12288,0.03355733222431607
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,6144,16384,0.04643644558058845
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,6144,16384,0.06701599889331393
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,6144,12288,0.03565866748491923
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,6144,10240,0.02948444419436985
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,6144,12288,0.05577244361241659
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,6144,8192,0.02274399995803833
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,6144,10240,0.03190133306715224
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,6144,51200,0.15457155969407824
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,6144,65536,0.19166221883561876
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,6144,10240,0.04988266693221199
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,6144,7168,0.02128977742460039
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,6144,8192,0.027456000447273254
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,6144,6144,0.018214222457673814
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,6144,8192,0.0455297761493259
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,6144,7168,0.02493600050608317
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,6144,7168,0.04203288753827413
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,6144,5120,0.01465777721669939
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,6144,6144,0.03940355446603563
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,6144,6144,0.023352889551056757
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,6144,4096,0.013091555900043912
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,6144,3584,0.01149777736928728
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,6144,5120,0.03677599959903293
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,6144,5120,0.020847110284699336
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,6144,4096,0.03461688756942749
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,6144,3072,0.011036444041464063
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,6144,4096,0.019256000717480976
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,6144,2560,0.009641778137948778
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,6144,3584,0.03231822119818793
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,6144,3584,0.018578666779730055
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,6144,3072,0.03314666615592109
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,6144,3072,0.017838221457269456
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,6144,2048,0.008252444366614023
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,6144,1536,0.007259555160999298
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,6144,2560,0.029896001021067303
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,6144,2048,0.015190222197108798
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,6144,1024,0.005893333504597346
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,6144,1536,0.025736000802781846
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,6144,1024,0.02444444431198968
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,6144,1024,0.014151111245155334
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,6144,768,0.00479288895924886
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,6144,768,0.013449778159459433
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,6144,512,0.0038773334688610504
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,6144,512,0.01276711126168569
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,7168,4096,0.03554577628771464
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,6144,512,0.023732443650563557
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,6144,256,0.003572444534964032
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,6144,128,0.0031555555760860443
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,6144,256,0.01241422196229299
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,6144,256,0.022311111291249592
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,6144,64,0.0028826666788922418
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,6144,2560,0.016418667303191293
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,6144,128,0.019688889384269714
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,6144,128,0.011748444702890186
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,6144,32,0.0028906667398081887
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,6144,2048,0.02924799919128418
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,6144,64,0.012725333372751871
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,6144,1536,0.014930667148696052
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,6144,32,0.012874667015340594
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,5120,65536,0.11818222204844157
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,5120,51200,0.09235911236868964
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,5120,16384,0.03460266523891025
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,5120,51200,0.11386399798923069
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,5120,16384,0.045364442798826426
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,6144,768,0.023592889308929443
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,5120,12288,0.029507554239696924
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,5120,10240,0.025427555044492085
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,5120,16384,0.06663999954859416
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,5120,12288,0.03445600138770209
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,5120,12288,0.05505422088834974
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,5120,8192,0.022319111559126113
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,5120,51200,0.1534737745920817
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,5120,10240,0.0494026674164666
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,5120,65536,0.18934755855136445
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,5120,7168,0.019944889677895438
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,5120,6144,0.015084443820847405
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,5120,8192,0.026499556170569524
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,5120,8192,0.04471288786994087
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,5120,7168,0.04103022151523166
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,5120,7168,0.02465244465404087
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,5120,5120,0.012727110750145383
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,5120,6144,0.022996443841192458
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,5120,6144,0.04016710983382331
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,5120,4096,0.0118568887313207
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,5120,5120,0.020854221449957952
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,5120,5120,0.03660800059636434
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,5120,3584,0.010599111517270407
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,5120,4096,0.019262222780121695
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,5120,3072,0.010225777824719747
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,5120,3584,0.01869333287080129
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,5120,3584,0.03331911232736375
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,5120,2560,0.008967111508051554
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,5120,65536,0.14437599976857504
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,5120,3072,0.01733955575360192
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,5120,3072,0.031088001198238794
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,5120,2048,0.008203555312421586
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,5120,2560,0.016480889585283067
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,5120,2560,0.030532442861133154
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,5120,1536,0.006599111275540457
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,5120,2048,0.027422222826215956
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,5120,2048,0.014431110686726041
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,5120,1024,0.005202666752868229
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,5120,1536,0.026072000463803608
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,5120,768,0.004869333157936732
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,5120,1024,0.01333333303531011
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,5120,1024,0.025359110699759588
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,5120,10240,0.030996445152494643
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,5120,768,0.013097777962684631
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,5120,512,0.012442666623327466
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,5120,256,0.003560888684458203
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,5120,512,0.023383110761642456
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,5120,256,0.022325333621766832
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,5120,128,0.0031644445326593188
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,5120,4096,0.03471111257870992
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,5120,128,0.011720889144473605
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,5120,128,0.019925332731670804
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,5120,64,0.003192000091075897
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,5120,32,0.0031582222630580268
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,5120,64,0.012106666962305704
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,4096,65536,0.0878960026635064
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,5120,32,0.012103999654452005
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,4096,51200,0.07277777459886339
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,5120,1536,0.014153778553009033
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,4096,65536,0.10399111111958821
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,4096,16384,0.02958400050799052
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,5120,512,0.0041955556306574075
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,4096,51200,0.08257066541247897
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,5120,768,0.023689778314696416
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,4096,12288,0.02443555494149526
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,4096,16384,0.03317155440648397
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,4096,16384,0.06612888971964519
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,4096,10240,0.021893334057595994
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,4096,12288,0.02625244524743822
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,4096,65536,0.1885288953781128
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,4096,8192,0.01644088824590047
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,5120,256,0.011774222056070963
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,4096,51200,0.152895106209649
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,4096,10240,0.02331377731429206
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,4096,10240,0.04863644308514065
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,4096,7168,0.014450665977266101
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,4096,6144,0.012746666868527731
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,4096,8192,0.04348799917432997
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,4096,8192,0.021606221795082092
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,4096,5120,0.011736888852384357
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,4096,7168,0.04144533475240072
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,4096,7168,0.019814221395386588
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,4096,4096,0.010323555933104621
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,4096,6144,0.039461334546407066
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,4096,6144,0.018940443793932598
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,4096,3584,0.008992888861232335
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,4096,5120,0.01756355497572157
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,4096,5120,0.03603911068704393
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,4096,3072,0.008381333616044786
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,4096,4096,0.01613333324591319
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,4096,4096,0.03484266665246751
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,4096,2560,0.007613333563009898
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,4096,3584,0.015810666812790763
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,4096,2048,0.006800000038411882
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,4096,3072,0.014831999937693277
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,4096,2560,0.029185778564876978
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,4096,1536,0.005335111171007156
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,4096,2048,0.026751110951105755
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,4096,2048,0.013415999710559845
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,4096,1024,0.004530666602982415
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,4096,1536,0.013419555293189155
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,4096,1536,0.026084444589085046
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,4096,768,0.003962666624122196
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,4096,1024,0.012728888955381183
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,4096,1024,0.024000888069470722
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,4096,512,0.0035111109415690103
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,4096,768,0.012427555190192329
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,4096,12288,0.05482133229573568
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,4096,512,0.012049777640236748
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,4096,512,0.022631999519136217
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,4096,256,0.0032151111712058387
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,4096,128,0.003160888950030009
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,4096,256,0.011699555648697747
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,4096,128,0.011703111231327057
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,4096,128,0.019645333290100098
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,4096,64,0.0029235554652081597
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,4096,3584,0.03323555654949612
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,4096,32,0.0031662223239739737
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,4096,3072,0.029119110769695703
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,4096,2560,0.013838222457302941
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,4096,64,0.011729777687125735
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,3584,65536,0.0785635577307807
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,4096,32,0.01241422196229299
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,3584,51200,0.06333333253860474
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,3584,65536,0.10129421949386597
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,3584,51200,0.08065866761737399
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,3584,16384,0.02682755556371477
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,4096,768,0.023657777243190344
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,3584,16384,0.03154666556252374
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,3584,12288,0.02108088963561588
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,3584,16384,0.06612888971964519
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,3584,65536,0.18819733460744223
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,3584,51200,0.15193511380089655
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,3584,10240,0.01819022165404426
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,3584,8192,0.017549332645204332
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,3584,12288,0.02537155482504103
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,3584,12288,0.05424799852901035
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,4096,256,0.020928000410397846
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,3584,7168,0.015475556254386902
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,3584,10240,0.048390222920311816
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,3584,10240,0.022985777921146814
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,3584,8192,0.043976889716254346
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,3584,6144,0.01459822224246131
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,3584,8192,0.021032000581423443
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,3584,7168,0.019408888287014432
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,3584,5120,0.01131199962562985
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,3584,7168,0.04105510976579454
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,3584,4096,0.00996088898844189
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,3584,6144,0.018529777725537617
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,3584,6144,0.03965866565704346
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,3584,3584,0.008938666847017076
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,3584,5120,0.017292444904645283
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,3584,5120,0.03638844357596503
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,3584,4096,0.015842666228612263
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,3584,4096,0.03376177615589566
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,3584,2560,0.007287110719415877
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,3584,3584,0.01551999979548984
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,3584,3584,0.032073779238594904
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,3584,3072,0.01500888831085629
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,3584,2048,0.006271111054552927
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,3584,3072,0.029286222325430974
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,3584,1536,0.005277333160241445
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,3584,2560,0.029322667254341975
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,3584,2560,0.013746666411558786
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,3584,2048,0.027059555053710938
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,3584,2048,0.0131217779384719
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,3584,1536,0.013414222333166333
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,3584,1536,0.026855111122131348
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,3584,768,0.003850666599141227
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,3584,1024,0.012720888687504662
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,3584,512,0.0035048888789282907
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,3584,768,0.0236471113231447
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,3584,768,0.012612444659074148
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,3584,256,0.0031795555518733132
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,3584,512,0.012530666258600024
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,3584,128,0.002854222224818336
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,3584,256,0.022146667043368023
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,3584,256,0.011424000064531961
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,3584,64,0.002874666617976295
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,3584,128,0.0196142229768965
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,3584,32,0.0028497777465316984
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,3584,64,0.011374221907721626
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,3072,65536,0.06929510831832886
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,3584,3072,0.008120888637171851
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,3072,65536,0.09929955667919582
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,3072,51200,0.05673244264390734
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,3584,1024,0.023974221613672044
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,3072,51200,0.07841600312127008
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,3072,65536,0.18819110923343232
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,3072,16384,0.022506665852334764
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,3584,512,0.022675555613305833
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,3072,16384,0.03116977877087063
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,3072,12288,0.01868266695075565
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,3072,16384,0.06549777587254842
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,3072,10240,0.016192000773217943
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,3072,51200,0.15174667040506998
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,3072,12288,0.02455733385350969
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,3584,128,0.011709333293967776
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,3072,12288,0.053723557127846606
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,3072,8192,0.014324444863531323
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,3072,7168,0.013727111121018728
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,3072,10240,0.04808444446987576
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,3072,8192,0.020624000165197585
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,3072,8192,0.04359289010365804
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,3584,32,0.012423111332787408
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,3072,6144,0.012424888710180918
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,3072,5120,0.01126844435930252
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,3072,7168,0.01937599976857503
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,3072,7168,0.040363556808895536
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,3072,4096,0.009920000202125972
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,3072,6144,0.03927200039227804
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,3072,5120,0.036766221125920616
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,3072,5120,0.01717688971095615
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,3072,3584,0.008617777791288164
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,3072,4096,0.03361422154638503
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,3072,4096,0.015843555331230164
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,3072,3072,0.008368888662921058
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,3072,3584,0.014947555131382413
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,3072,3584,0.030889779329299927
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,3072,2560,0.007463110817803278
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,3072,3072,0.014134221606784396
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,3072,3072,0.02942488922013177
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,3072,2048,0.006519111080302133
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,3072,2560,0.013909333282046847
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,3072,2048,0.013749333719412485
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,3072,2048,0.02777422302299076
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,3072,1536,0.0053324442770746015
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,3072,1536,0.025705777936511572
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,3072,1024,0.004242666479614046
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,3072,10240,0.022450667288568284
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,3072,1024,0.012739555703269111
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,3072,1024,0.024108444650967915
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,3072,768,0.0038515557017591265
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,3072,6144,0.01807466646035512
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,3072,512,0.0035297779573334586
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,3072,768,0.012039999994966718
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,3584,1024,0.004187555362780889
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,3072,256,0.0033395555284288195
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,3072,512,0.012058667010731168
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,3072,512,0.022289777795473736
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,3072,128,0.002855111120475663
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,3072,256,0.02160800000031789
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,3072,256,0.011357333097192975
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,3072,64,0.0028195555011431375
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,3072,128,0.011149333582984077
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,3072,32,0.0028808888875775864
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,3072,128,0.019151111443837483
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,3072,2560,0.028819554381900366
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,3072,64,0.011423110961914062
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,2560,65536,0.06012711260053846
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,3072,32,0.011026666396194033
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,2560,51200,0.04871911141607496
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,2560,65536,0.09483822186787923
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,3072,1536,0.013390222357379066
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,2560,51200,0.07397688759697808
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,2560,16384,0.030341333813137476
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,2560,12288,0.018177777528762817
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,2560,16384,0.0652515557077196
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,2560,51200,0.1516586674584283
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,2560,65536,0.1871955527199639
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,2560,10240,0.015487111277050443
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,2560,12288,0.05357244279649523
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,2560,12288,0.024118221468395654
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,2560,8192,0.013918222652541267
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,2560,7168,0.013360000318951078
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,2560,10240,0.0479964448346032
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,2560,8192,0.04298311140802172
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,2560,8192,0.020297777321603563
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,2560,6144,0.011325333681371478
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,2560,7168,0.01925066610177358
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,2560,7168,0.04088177614741855
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,2560,5120,0.010276444256305695
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,2560,6144,0.017394666870435078
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,2560,6144,0.03875199953715006
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,2560,4096,0.009174221919642555
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,2560,5120,0.036518222755855985
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,2560,5120,0.01643022232585483
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,2560,3584,0.008262222011884054
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,2560,4096,0.014765333798196582
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,2560,4096,0.031903111272388034
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,2560,3072,0.007583111524581909
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,2560,3584,0.014440889159838358
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,2560,2560,0.006911110960774952
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,2560,3072,0.02983733349376255
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,2560,3072,0.014092443717850579
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,2560,2048,0.006136000156402588
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,2560,16384,0.020216888851589628
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,2560,2560,0.013445333474212222
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,2560,2560,0.02812888887193468
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,2560,1536,0.004816888935036129
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,2560,2048,0.026392888691690233
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,2560,2048,0.01313688854376475
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,2560,1024,0.004204444587230682
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,2560,1536,0.02507200009293026
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,2560,1536,0.012758221891191272
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,2560,768,0.0038862224254343244
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,2560,1024,0.024341333243581984
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,2560,512,0.0035111109415690103
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,2560,768,0.02330488959948222
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,2560,768,0.012116444607575735
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,2560,10240,0.02228533393806881
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,2560,512,0.012057777908113269
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,2560,512,0.02234755622016059
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,2560,128,0.002874666617976295
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,2560,256,0.01163644426398807
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,2560,256,0.02130577796035343
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,2560,64,0.0028817777832349143
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,2560,128,0.011379555695586734
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,2560,128,0.018358222312397428
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,2560,32,0.0028657778683635923
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,2560,64,0.011418666276666852
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,2048,65536,0.04911199874348111
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,2560,32,0.011358222199810876
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,2560,3584,0.031207998593648274
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,2048,51200,0.040786667002571955
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,2048,65536,0.09277066919538711
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,2048,51200,0.07417955663469103
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,2048,65536,0.18688178062438965
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,2048,16384,0.01763288842307197
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,2560,1024,0.01239466667175293
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,2048,16384,0.029511110650168523
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,2048,16384,0.06504178047180176
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,2048,12288,0.015169777803950839
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,2048,10240,0.013861333330472311
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,3072,768,0.0240320000383589
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,2048,12288,0.023800889650980633
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,2048,12288,0.05371555685997009
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,2048,8192,0.012799999780125089
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,2048,10240,0.021772444248199463
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,2048,10240,0.04793955551253425
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,2048,7168,0.01167377746767468
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,2048,8192,0.020241777102152508
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,2048,8192,0.04298399885495504
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,2048,6144,0.011054221954610614
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,2048,7168,0.040103111002180315
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,2048,7168,0.018567999203999836
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,2048,5120,0.00996800015370051
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,2048,6144,0.016875555117925007
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,2048,6144,0.039289779133266874
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,2048,4096,0.010481778118345471
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,2048,5120,0.016494222813182406
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,2048,5120,0.033942222595214844
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,2048,3584,0.009291555318567488
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,2048,4096,0.031735112269719444
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,2048,3072,0.008951110972298516
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,2048,3584,0.029863999949561224
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,2048,3072,0.01390044391155243
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,2048,3072,0.029465778006447688
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,2048,2560,0.008052444292439355
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,2048,51200,0.15215555826822916
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,2048,2560,0.027401778433057997
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,2048,2560,0.013487111363146039
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,2048,2048,0.0052675555149714155
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,2048,1536,0.004880889008442561
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,2560,256,0.0032177778581778207
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,2048,2048,0.02677244444688161
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,2048,2048,0.013086222112178802
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,2048,1024,0.004184000194072723
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,2048,1536,0.01278222186697854
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,2048,1536,0.025785777303907607
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,2048,768,0.0038408889538711975
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,2048,1024,0.025015999873479206
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,2048,512,0.0035093331502543557
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,2048,768,0.023335999912685815
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,2048,768,0.01204622205760744
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,2048,256,0.0031999999450312722
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,2048,512,0.012063110868136087
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,2048,512,0.02252977755334642
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,2048,128,0.002862222285734283
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,2048,256,0.011527111132939657
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,2048,64,0.0028568889117903183
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,2048,4096,0.014945778581831189
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,2048,128,0.019898666275872123
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,2048,32,0.002842666581273079
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,2048,3584,0.014431110686726041
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,1536,65536,0.0385519994629754
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,2048,64,0.011063111325105032
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,2048,32,0.012065778175989786
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,1536,51200,0.030167112747828167
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,1536,65536,0.09029244714313084
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,1536,16384,0.018554665976100497
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,1536,51200,0.07219733132256402
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,1536,65536,0.18808889389038086
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,1536,51200,0.15181599722968206
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,1536,12288,0.016181333197487723
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,1536,16384,0.029100444581773546
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,1536,16384,0.06516800324122111
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,1536,10240,0.014254222313563028
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,1536,12288,0.023132445083724126
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,1536,10240,0.021548445026079815
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,2048,1024,0.012545777691735161
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,1536,10240,0.04758933186531067
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,1536,7168,0.01198933356338077
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,1536,8192,0.0417848891682095
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,1536,8192,0.01889866590499878
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,1536,6144,0.011063111325105032
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,1536,7168,0.01755644381046295
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,1536,7168,0.03955466548601786
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,1536,5120,0.009684444301658207
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,2048,256,0.022279999322361414
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,1536,6144,0.03633155425389608
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,2048,128,0.011357333097192975
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,1536,4096,0.008274666965007782
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,1536,5120,0.03422933485772874
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,1536,4096,0.014492443866199918
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,1536,3584,0.007313778003056844
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,1536,4096,0.031312889522976346
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,1536,3072,0.006696888970004187
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,1536,3584,0.030135111676322088
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,1536,3584,0.014152000347773233
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,1536,2560,0.005981333139869902
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,1536,3072,0.013821333646774292
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,1536,3072,0.029170665476057265
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,1536,2048,0.0052728888889153796
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,1536,2560,0.028416001134448584
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,1536,2560,0.013424889081054263
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,1536,1536,0.005554666535721884
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,1536,2048,0.013089777694808112
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,1536,2048,0.026735110415352717
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,1536,12288,0.05371110969119602
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,1536,1024,0.0038399998512532976
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,1536,1536,0.01273333364062839
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,1536,8192,0.012805333567990197
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,1536,1536,0.02472355630662706
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,1536,768,0.0038382220599386427
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,1536,512,0.0032213332338465583
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,1536,1024,0.025037333369255066
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,1536,1024,0.012512889173295764
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,1536,768,0.023349333140585158
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,1536,768,0.012049777640236748
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,1536,256,0.0032106666929192017
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,1536,128,0.003019555575317807
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,1536,512,0.011757333245542316
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,1536,512,0.022954665952258643
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,1536,64,0.002597333242495855
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,1536,256,0.020612445142534044
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,1536,256,0.011411555939250521
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,1536,32,0.0028533333291610083
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,1536,128,0.011731555892361535
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,1536,128,0.018918222851223417
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,1024,65536,0.02863466739654541
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,1536,64,0.011417778001891242
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,1536,32,0.010703110860453712
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,1024,51200,0.02602133320437537
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,1536,5120,0.015508444772826301
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,1024,16384,0.012844444149070315
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,1024,65536,0.08653689093059963
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,1024,12288,0.010474666953086853
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,1024,51200,0.06737066639794244
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,1024,16384,0.02865866820017497
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,1024,65536,0.1883875528971354
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,1024,16384,0.06391288836797078
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,1024,10240,0.011757333245542316
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,1024,51200,0.151344895362854
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,1024,8192,0.012773333324326409
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,1024,12288,0.023053333163261414
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,1024,10240,0.04693422383732266
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,1024,7168,0.011765333513418833
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,1024,10240,0.02073955535888672
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,1024,8192,0.018254222141371835
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,1024,8192,0.040956444210476346
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,1024,6144,0.01147822207874722
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,1024,5120,0.009695111049546136
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,1024,7168,0.039292444785436
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,1024,7168,0.01716977854569753
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,1024,6144,0.035995556248558894
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,1024,4096,0.007948444121413762
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,1024,5120,0.015471110741297403
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,1024,5120,0.03432710965474447
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,1024,3584,0.0069546666410234236
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,1024,4096,0.03128355410363939
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,1024,4096,0.014662222729788886
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,1024,3072,0.006582222051090664
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,1024,3584,0.029172443681293066
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,1024,2560,0.0058906666106647914
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,1024,3072,0.028813332319259644
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,1024,3072,0.013759111364682516
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,1024,2048,0.006241777704821692
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,1536,6144,0.016531555189026725
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,1024,2560,0.01348622226052814
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,1024,2560,0.027756444282001917
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,1024,1536,0.005562666803598404
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,1024,2048,0.026782222919993933
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,1024,1024,0.004243555582231945
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,1024,1536,0.024720888998773363
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,1024,1024,0.012392889294359418
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,1024,1024,0.02405244443151686
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,1024,768,0.0038524443904558816
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,1024,12288,0.05345866746372647
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,1024,512,0.0038480001191298165
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,1024,768,0.023761777414215937
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,1024,768,0.012071111136012606
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,1024,256,0.0035004446076022256
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,1024,512,0.01202311118443807
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,1024,512,0.022960889670583937
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,1024,6144,0.016224000189039443
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,1024,128,0.0031848889258172777
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,1024,256,0.011381333072980246
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,1024,256,0.021984888447655573
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,1024,64,0.002862222285734283
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,1024,128,0.019949333535300363
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,1024,128,0.011353777514563667
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,768,65536,0.023188443647490606
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,1024,64,0.011439999772442712
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,1024,32,0.011880888707107969
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,768,51200,0.025068443682458665
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,768,65536,0.08500444226794773
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,768,65536,0.18779999679989287
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,1024,2048,0.013040888640615674
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,768,51200,0.06590133243136935
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,768,16384,0.012072000238630505
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,768,12288,0.010822222464614444
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,1024,1536,0.012464889221721225
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,768,51200,0.15104356076982287
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,768,16384,0.028332445356580947
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,768,16384,0.06411555740568373
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,768,10240,0.010255110760529837
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,768,12288,0.021956443786621094
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,768,12288,0.05208977725770739
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,768,8192,0.01110222190618515
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,768,10240,0.020586666133668687
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,768,10240,0.04628444380230374
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,768,7168,0.01034311122364468
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,768,8192,0.040700445572535195
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,768,8192,0.018191999859280057
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,768,6144,0.009287111461162567
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,768,7168,0.01722400055991279
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,768,7168,0.03850933247142368
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,768,5120,0.00869777798652649
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,768,6144,0.016180444094869826
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,768,6144,0.036044445302751325
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,768,4096,0.008092444803979661
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,1024,32,0.0028737777223189673
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,768,5120,0.015585778488053216
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,768,5120,0.03328444560368856
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,768,3072,0.006585777633719974
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,768,4096,0.03187911046875848
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,1024,3584,0.014249778456158109
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,768,4096,0.014494222071435718
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,768,3584,0.029461334149042766
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,768,3072,0.013801777528391944
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,768,3072,0.028839998775058325
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,768,2560,0.013481777575280933
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,768,2560,0.027806222438812256
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,768,1536,0.004691555682155821
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,768,2048,0.01313066648112403
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,768,2048,0.02639644510216183
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,768,1024,0.0038888889054457345
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,768,1536,0.012798222402731577
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,768,1536,0.02574666672282749
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,768,768,0.0036106668412685394
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,768,1024,0.012074666718641916
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,768,1024,0.02500266664557987
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,768,512,0.003168888803985384
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,768,768,0.012070222033394707
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,768,768,0.0233262214395735
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,768,256,0.003175111073586676
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,768,512,0.012063999970753988
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,768,512,0.02295111119747162
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,768,128,0.002867555452717675
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,768,256,0.01149777736928728
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,768,256,0.022336888644430373
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,768,64,0.0028124445428450904
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,768,128,0.01165511127975252
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,768,3584,0.006611555400821898
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,768,128,0.018209778600268893
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,512,65536,0.02316711180739933
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,768,64,0.011713777979214987
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,768,2560,0.005592888842026393
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,768,32,0.010743111371994019
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,512,51200,0.019143111175960965
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,768,2048,0.0052791109515561005
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,512,65536,0.08324178059895833
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,512,16384,0.013089777694808112
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,512,65536,0.18837866518232557
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,512,51200,0.06405778063668145
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,512,12288,0.010713777608341642
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,512,51200,0.15145777331458196
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,512,16384,0.027141332626342773
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,512,10240,0.010021333065297868
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,512,12288,0.02161866592036353
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,512,12288,0.052946666876475014
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,512,8192,0.008627555436558193
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,512,10240,0.046246220668156944
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,512,10240,0.019913777709007263
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,512,7168,0.008330666356616551
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,512,8192,0.040448000033696495
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,512,6144,0.007896888587209914
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,512,7168,0.01683822274208069
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,512,6144,0.015972443752818637
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,512,6144,0.03595022360483805
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,512,5120,0.008185777399275038
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,768,32,0.002518222149875429
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,512,5120,0.0332568883895874
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,512,5120,0.015125332607163323
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,512,4096,0.007644444704055786
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,512,3584,0.006940444310506185
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,768,3584,0.014147554834683737
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,512,4096,0.03122133347723219
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,512,4096,0.014427555931939019
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,512,3072,0.0063031112982167145
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,512,3584,0.014162666267818876
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,512,3584,0.02913244565327962
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,512,2560,0.005609777652555042
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,512,3072,0.013759999639458127
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,512,3072,0.028888887829250757
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,512,2048,0.005570666657553778
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,512,2560,0.028078221612506445
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,512,2560,0.013190222283204397
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,512,16384,0.06237066454357571
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,512,1536,0.004557333472702238
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,512,1024,0.003871110992299186
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,512,2048,0.025754666990704004
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,512,2048,0.012788444757461548
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,512,1536,0.02472355630662706
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,512,1536,0.012413333687517377
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,512,768,0.003532444437344869
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,512,1024,0.02338933282428318
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,512,8192,0.01825777855184343
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,512,512,0.0031591111587153543
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,512,768,0.023081777824295893
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,512,7168,0.03797600004408095
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,512,256,0.003149333306484752
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,512,512,0.022392888863881428
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,512,512,0.012048888537618848
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,512,128,0.00281866660548581
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,512,256,0.011762667033407422
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,512,256,0.02125511070092519
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,512,64,0.0025315555847353404
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,512,128,0.018203554881943595
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,512,128,0.011760888828171624
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,256,65536,0.018226666582955253
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,512,64,0.01108444482088089
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,512,32,0.011081777513027191
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,256,51200,0.015513777732849121
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,256,65536,0.0784719983736674
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,256,65536,0.18613244427575004
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,256,16384,0.010040000081062317
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,256,51200,0.06241599718729655
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,256,51200,0.15047555499606663
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,256,12288,0.010415111151006486
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,256,16384,0.026081777281231348
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,256,16384,0.06152444415622287
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,256,10240,0.009197333620654212
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,512,1024,0.012376888758606382
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,256,12288,0.02188088827662998
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,256,12288,0.05063822203212314
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,256,8192,0.008347555167145198
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,512,768,0.01204355557759603
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,256,10240,0.019564444820086162
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,256,10240,0.0455057786570655
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,256,7168,0.00795999997191959
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,256,8192,0.01789155602455139
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,256,8192,0.041053334871927895
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,256,6144,0.00833511104186376
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,256,5120,0.008007110820876228
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,256,7168,0.01682577696111467
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,256,7168,0.03836355606714884
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,512,32,0.002846222163902389
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,256,6144,0.03631644447644552
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,256,6144,0.01585422290696038
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,256,3584,0.006924444602595435
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,256,5120,0.01511111193233066
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,256,5120,0.033246222469541765
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,256,3072,0.00674222202764617
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,256,4096,0.031855109665128924
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,256,4096,0.014819555812411837
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,256,2560,0.006324444380071428
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,256,3584,0.013810666898886362
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,256,3072,0.01350311107105679
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,256,3072,0.029099557134840224
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,256,2048,0.0052151112920708126
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,256,2560,0.013471110827393003
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,256,2560,0.02706577711635166
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,256,1536,0.004565333326657613
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,256,2048,0.013199110825856527
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,256,2048,0.02607911162906223
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,256,1024,0.0037662221325768363
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,256,1536,0.012437333663304647
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,256,1536,0.02641511129008399
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,256,768,0.00349866681628757
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,256,1024,0.025003555748197768
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,256,1024,0.012028444144460889
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,256,512,0.003428444473279847
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,256,768,0.0124177775449223
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,256,768,0.023316444622145757
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,256,256,0.002846222163902389
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,256,512,0.011424000064531961
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,256,512,0.02273955610063341
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,256,128,0.002826666666401757
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,256,256,0.011016888750924004
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,256,64,0.0028159999185138275
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,256,32,0.002522666628162066
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,256,128,0.011690666278203329
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,256,128,0.018218666315078735
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,128,65536,0.015321777926550971
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,256,64,0.011014222270912595
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,256,4096,0.007291555404663086
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,128,51200,0.014767110347747803
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,128,65536,0.07728533612357245
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,128,16384,0.009341333475377824
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,128,51200,0.06275644567277697
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,128,65536,0.18685332934061685
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,256,3584,0.029104888439178467
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,128,12288,0.008280889027648503
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,128,16384,0.025732444392310247
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,128,16384,0.06163555383682251
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,128,10240,0.009341333475377824
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,128,12288,0.02159999973244137
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,128,8192,0.008295111358165741
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,128,10240,0.0448968874083625
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,128,10240,0.019892444213231403
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,128,7168,0.007921777665615082
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,128,8192,0.017913776967260573
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,128,8192,0.04007644454638163
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,128,7168,0.01682577696111467
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,128,7168,0.03736089004410638
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,128,6144,0.007242666350470648
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,256,256,0.02164711058139801
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,128,5120,0.006952889263629913
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,128,6144,0.03595911131964789
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,128,6144,0.015792000624868605
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,128,4096,0.006609777609507243
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,256,32,0.011041777829329172
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,128,5120,0.015480000111791821
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,128,5120,0.033209777540630765
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,128,3584,0.006611555400821898
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,128,4096,0.014107555150985718
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,128,4096,0.031112889448801678
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,128,3072,0.006230222268237009
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,128,3584,0.013801777528391944
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,128,3584,0.030229333374235366
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,128,2560,0.006325333482689328
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,128,51200,0.14973333146837023
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,128,2048,0.006292444550328785
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,128,3072,0.013769778112570444
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,128,2560,0.027059555053710938
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,128,12288,0.05130222108629015
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,128,2560,0.013807111316257052
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,128,2048,0.026426666312747534
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,128,2048,0.012717333104875354
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,128,1024,0.003693333516518275
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,128,1536,0.02644888891114129
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,128,1536,0.01275288893116845
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,128,768,0.003530666646030214
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,128,1024,0.012048888537618848
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,128,1024,0.02366133365366194
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,128,512,0.003168888803985384
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,128,768,0.02436888880199856
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,128,768,0.01204177737236023
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,128,256,0.0029164445069101122
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,128,512,0.011546666423479715
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,128,128,0.0025902222841978073
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,128,256,0.011722666521867117
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,128,128,0.010680889089902243
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,128,128,0.01956977778010898
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,128,64,0.0028213332924577924
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,128,32,0.0025315555847353404
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,128,64,0.011420444481902652
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,128,32,0.010746666954623329
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,64,65536,0.014493332968817817
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,64,51200,0.013768889009952545
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,128,3072,0.02875022093454997
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,64,65536,0.07691555553012423
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,64,16384,0.008319999608728621
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,64,12288,0.007640000018808577
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,64,51200,0.06040800280041165
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,128,1536,0.004538666870858935
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,64,10240,0.007278222176763747
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,64,8192,0.006760889043410619
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,64,16384,0.025722665919197932
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,64,12288,0.021078222327762183
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,64,10240,0.0196782218085395
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,64,6144,0.006291555447710886
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,64,8192,0.017906667457686532
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,64,5120,0.006263999889294307
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,64,7168,0.01651822196112739
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,64,4096,0.005668444352017508
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,64,6144,0.01587377819750044
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,128,512,0.022120889690187242
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,64,3584,0.005943111247486538
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,64,5120,0.015485333071814643
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,64,3072,0.005951111101441913
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,64,4096,0.014093332820468478
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,64,2048,0.005952888892756567
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,64,3584,0.013759111364682516
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,64,3072,0.013773333695199756
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,64,1536,0.00434933313065105
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,64,2560,0.01290844463639789
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,64,1024,0.0038453332251972626
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,64,768,0.0035208890007601846
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,64,2048,0.01276177747382058
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,64,512,0.003206222214632564
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,64,1536,0.01239111108912362
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,64,1024,0.012062222593360476
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,64,256,0.002732444347606765
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,64,768,0.012048888537618848
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,64,128,0.002537777854336633
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,64,64,0.002477333363559511
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,64,512,0.011379555695586734
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,64,32,0.0025351111673646504
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,64,256,0.011027555498811932
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,64,128,0.01146577795346578
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,32,65536,0.014101333088344999
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,64,64,0.010684444672531553
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,32,51200,0.013450666434235044
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,64,32,0.010657777388890585
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,32,16384,0.007993777592976889
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,32,12288,0.007655999726719326
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,32,65536,0.07442844576305814
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,64,7168,0.006296000132958095
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,32,51200,0.06005066633224487
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,32,10240,0.007252444823582967
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,32,16384,0.02572000026702881
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,32,8192,0.00657066661450598
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,32,7168,0.006625777731339137
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,32,10240,0.019575999842749704
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,32,8192,0.017532444662517972
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,32,6144,0.0064897777305708984
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,32,5120,0.005947555518812603
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,32,7168,0.016840888394249808
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,80,128,256,0.02164799968401591
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,32,4096,0.0057884446448749965
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,64,2560,0.005973333285914526
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,32,6144,0.015763555963834126
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,32,3584,0.005941333456171884
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,32,3072,0.005927111125654644
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,32,5120,0.015135111080275642
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,32,2560,0.005951111101441913
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,32,2048,0.005710222240951326
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,32,4096,0.014819555812411837
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,32,3584,0.013751111096805997
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,32,1536,0.0042239998777707415
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,32,1024,0.0038764443662431505
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,32,2560,0.013188444077968597
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,32,768,0.0034924443397257063
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,32,2048,0.012736000120639801
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,32,512,0.0032151111712058387
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,32,1536,0.012378666963842181
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,32,1024,0.01239822225438224
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,32,256,0.0028640000770489373
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,32,128,0.0028231110837724474
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,32,768,0.011768889096048145
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,32,64,0.002487999904486868
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,32,512,0.011369778050316704
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,80,32,32,0.002489777695801523
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,32,256,0.011737777955002256
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,32,128,0.010755555497275459
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,32,64,0.010399111443095738
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,32,32,0.010240889257854885
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,32,12288,0.021314667330847845
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,65536,16384,0.2104168865415785
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,65536,16384,0.38184711668226456
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,65536,12288,0.29075466261969674
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,65536,51200,0.6231519911024306
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,65536,10240,0.21823733382754854
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,65536,12288,0.15805421935187444
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,65536,8192,0.17415822876824272
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,65536,10240,0.13497243987189397
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,65536,7168,0.15383022361331516
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,65536,8192,0.11534578270382351
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,65536,6144,0.13268533017900255
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,65536,51200,1.209652476840549
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,65536,5120,0.11379022068447536
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,65536,6144,0.08671200275421143
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,65536,4096,0.09171644184324478
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,65536,5120,0.0742702219221327
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,65536,7168,0.09861422247356838
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,65536,4096,0.062499556276533336
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,65536,3072,0.07004533211390178
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,65536,2560,0.05863910913467407
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,65536,2048,0.04876533481809828
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,65536,3072,0.050494223833084106
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,65536,2560,0.04509511258867052
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,65536,1536,0.03696799940533108
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,65536,2048,0.04004355602794223
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,65536,3584,0.05731733640034994
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,65536,1024,0.027247111002604168
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,80,32,3072,0.013529777526855469
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,65536,768,0.02091377807988061
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,65536,1536,0.05465244584613376
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,65536,512,0.014813333749771118
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,65536,256,0.009391110804345872
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,65536,128,0.007243555453088548
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,65536,1024,0.03975377811325921
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,65536,768,0.03127288818359375
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,65536,512,0.025042666329277888
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,65536,256,0.01953066719902886
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,65536,128,0.017512889371977914
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,65536,64,0.017761778500345018
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,65536,32,0.02100533412562476
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,65536,3584,0.0795253316561381
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,51200,65536,0.6506720119052464
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,51200,16384,0.2765057881673177
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,51200,51200,0.4964622391594781
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,51200,51200,0.8513164520263672
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,51200,65536,1.0837280485365126
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,65536,64,0.005225777626037598
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,65536,32,0.005340444544951121
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,51200,12288,0.20837777190738252
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,51200,8192,0.14175555441114637
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,51200,10240,0.1739351087146335
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,51200,8192,0.0939191116227044
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,51200,12288,0.12748800383673772
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,51200,16384,0.1690080033408271
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,51200,7168,0.0806257790989346
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,51200,6144,0.1073039968808492
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,51200,10240,0.10952622360653347
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,51200,7168,0.1249048842324151
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,51200,4096,0.0739555557568868
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,51200,5120,0.06157955858442518
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,51200,6144,0.07147644625769721
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,51200,3584,0.0656906697485182
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,51200,4096,0.05236000153753492
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,51200,3072,0.05758755736880832
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,51200,2560,0.048476444350348584
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,51200,3584,0.048269334766599864
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,51200,2048,0.03932977716128031
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,51200,3072,0.042986667818493314
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,51200,1536,0.0313022236029307
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,51200,2560,0.03858222232924567
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,51200,1024,0.02313333253065745
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,51200,768,0.01682044400109185
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,51200,512,0.012368888490729861
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,51200,1536,0.04399111204677158
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,51200,256,0.008323555191357931
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,51200,768,0.027071999178992376
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,51200,128,0.0052533331844541765
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,51200,512,0.022052443689770166
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,51200,64,0.004527111020353106
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,51200,256,0.0174666659699546
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,51200,32,0.004919111314747068
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,51200,128,0.016187555260128446
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,51200,64,0.015959110524919298
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,51200,32,0.01891911029815674
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,16384,65536,0.31793689727783203
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,16384,65536,0.2549040052625868
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,16384,51200,0.2502426571316189
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,51200,5120,0.09120711353090073
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,16384,16384,0.08298489120271471
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,16384,12288,0.06451644500096639
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,16384,51200,0.19604978296491835
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,16384,16384,0.07071110937330458
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,16384,10240,0.053660445743136935
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,16384,12288,0.0551546679602729
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,16384,8192,0.046205331881841026
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,51200,2048,0.03477333320511712
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,16384,7168,0.03926755653487311
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,16384,10240,0.048688001102871366
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,16384,6144,0.0343795551194085
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,16384,5120,0.029657777812745836
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,16384,8192,0.042931556701660156
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,16384,6144,0.03443200058407254
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,16384,4096,0.025058666865030926
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,16384,3584,0.021904889080259535
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,16384,5120,0.030994666947258845
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,16384,3072,0.019241778386963736
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,16384,4096,0.02643199927277035
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,16384,3584,0.02587022218439314
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,16384,2048,0.013391111459996967
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,16384,3072,0.023004444109068975
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,16384,1536,0.011047999891969891
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,16384,2560,0.020928000410397846
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,16384,1024,0.008960888617568547
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,16384,2048,0.01972888906796773
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,16384,768,0.007298666569921706
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,16384,1536,0.02260977857642704
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,16384,512,0.005579555614127054
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,16384,1024,0.019281778070661757
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,16384,256,0.003912000192536248
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,16384,768,0.01711466742886437
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,16384,512,0.01550044450494978
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,16384,128,0.0035075553589397003
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,16384,64,0.003212444484233856
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,16384,32,0.003536000019974179
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,16384,128,0.013089777694808112
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,16384,64,0.012440000143316058
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,16384,32,0.014451555079884
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,51200,1024,0.033420443534851074
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,16384,7168,0.03799110982153151
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,12288,65536,0.25451376703050405
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,12288,16384,0.0709457794825236
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,12288,65536,0.2020862234963311
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,12288,51200,0.19724088244967988
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,16384,2560,0.016176889340082806
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,12288,51200,0.15662488672468397
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,12288,10240,0.04562844501601326
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,12288,8192,0.03981066743532816
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,12288,16384,0.05850044223997328
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,12288,10240,0.040829333994123675
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,12288,7168,0.03333066569434272
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,12288,6144,0.028841776980294123
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,12288,8192,0.03657955593532986
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,12288,5120,0.0251519994603263
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,12288,7168,0.03247377938694424
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,12288,4096,0.022302221920755174
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,12288,6144,0.029701332251230877
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,12288,5120,0.02641777859793769
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,12288,3072,0.016545777519543965
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,12288,4096,0.023073777556419373
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,12288,2560,0.01402311192618476
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,16384,256,0.013075555364290873
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,12288,2048,0.01239111108912362
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,12288,3072,0.020455110404226515
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,12288,3584,0.021872889664438035
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,12288,1536,0.010299555957317352
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,12288,1024,0.008300444318188561
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,12288,2560,0.019392000304328073
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,12288,768,0.007051555646790399
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,12288,2048,0.018183999591403537
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,12288,1536,0.020581333173645865
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,12288,512,0.0052177777720822235
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,12288,256,0.003907555507289039
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,12288,1024,0.017284444636768766
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,12288,768,0.016159110599093966
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,12288,512,0.014675555957688225
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,12288,128,0.0037955554823080697
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,12288,64,0.0032319999817344877
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,12288,256,0.012856889102194043
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,12288,12288,0.055063999361462064
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,12288,32,0.003648888733651903
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,12288,128,0.012541333006487953
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,12288,64,0.012914666699038612
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,12288,12288,0.046224001381132335
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,12288,32,0.012661333713266583
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,10240,65536,0.2170142200258043
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,10240,51200,0.16900266541375053
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,10240,65536,0.1934880018234253
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,10240,51200,0.1508151160346137
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,12288,3584,0.01854933301607768
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,10240,10240,0.04080977704789903
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,10240,16384,0.05651199817657471
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,10240,12288,0.0445128877957662
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,10240,8192,0.03906844390763177
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,10240,10240,0.03932711150911119
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,10240,7168,0.030235555436876085
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,10240,6144,0.028697778781255085
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,10240,8192,0.034832000732421875
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,10240,5120,0.022636445032225713
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,10240,4096,0.020469332734743755
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,10240,6144,0.028597331709331934
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,10240,7168,0.03123289015558031
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,10240,5120,0.02574488851759169
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,10240,3584,0.016923555069499545
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,10240,4096,0.02221600049071842
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,10240,2560,0.013378666506873237
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,10240,3584,0.021384000778198242
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,10240,3072,0.020232889387342665
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,10240,2048,0.011385777758227454
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,10240,1536,0.010034666293197209
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,10240,2560,0.018909333480728995
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,10240,1024,0.007932444413503012
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,10240,2048,0.017881777551439073
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,10240,1536,0.019139554765489366
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,10240,768,0.006566222343179915
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,10240,1024,0.01608711149957445
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,10240,16384,0.06327111191219754
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,10240,256,0.0041422223051389056
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,10240,768,0.015206222732861837
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,10240,12288,0.04635555545488993
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,10240,128,0.003571555432346132
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,10240,64,0.0035137778355015647
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,10240,256,0.012437333663304647
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,10240,32,0.0035048888789282907
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,10240,128,0.01241422196229299
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,10240,64,0.012057777908113269
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,10240,32,0.012387555506494312
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,8192,65536,0.1765537791781955
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,8192,51200,0.13368711206648085
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,8192,65536,0.15062667263878718
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,10240,3072,0.015136000182893542
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,8192,16384,0.05145422286457486
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,8192,12288,0.0376853346824646
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,8192,10240,0.03126400046878391
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,8192,16384,0.045604444212383695
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,8192,51200,0.11686044269137913
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,8192,12288,0.03643466697798835
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,8192,8192,0.026868444350030687
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,8192,7168,0.023401778605249193
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,8192,6144,0.020262221495310467
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,8192,10240,0.0328746669822269
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,8192,5120,0.017850667238235474
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,8192,8192,0.029027554723951552
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,8192,7168,0.025571554899215698
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,8192,6144,0.023706666297382776
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,8192,3584,0.013374221821626028
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,8192,3072,0.012136889000733694
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,8192,4096,0.019941333267423842
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,8192,2560,0.01036000003417333
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,8192,3584,0.01924977699915568
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,8192,2048,0.009336888790130615
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,8192,3072,0.018200000127156574
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,8192,1536,0.007920888562997183
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,8192,2560,0.017216889394654166
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,8192,2048,0.016362667083740234
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,8192,1024,0.005902222047249476
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,8192,1536,0.016605334149466622
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,8192,768,0.004905777672926585
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,8192,512,0.00423555572827657
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,8192,1024,0.01513777838812934
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,8192,256,0.0035253332720862497
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,8192,768,0.014447111222479077
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,8192,128,0.003156444471743372
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,8192,512,0.013076444466908773
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,8192,64,0.0031715554909573663
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,8192,256,0.012409778104888068
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,8192,32,0.003168888803985384
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,8192,128,0.011704888608720569
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,8192,64,0.011427555647161273
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,8192,32,0.012509333590666452
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,7168,65536,0.15539556079440647
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,8192,4096,0.015477332803938123
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,10240,512,0.004918222212129169
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,8192,5120,0.02137600051032172
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,7168,65536,0.14658310678270128
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,7168,51200,0.126111110051473
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,7168,12288,0.03516355488035414
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,7168,51200,0.11470044983757867
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,10240,512,0.014016888207859464
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,7168,10240,0.02976177798377143
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,7168,16384,0.04456622070736355
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,7168,8192,0.025555556019147236
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,7168,12288,0.036208887894948326
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,7168,7168,0.022090666823916968
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,7168,6144,0.019471999671724107
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,7168,5120,0.016584000653690763
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,7168,7168,0.024716445141368445
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,7168,8192,0.028259555498758953
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,7168,6144,0.02321333355373806
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,7168,4096,0.014281777871979607
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,7168,3584,0.012721777790122561
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,7168,3072,0.01168444421556261
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,7168,4096,0.01959111127588484
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,7168,3584,0.01887022289964888
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,7168,2560,0.010024000373151567
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,7168,2048,0.009017777939637503
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,7168,3072,0.017940445078743827
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,7168,1536,0.007647111184067196
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,7168,2560,0.01719999975628323
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,7168,1024,0.005756444401211209
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,7168,1536,0.01683555543422699
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,7168,768,0.004559999952713649
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,7168,1024,0.014764444695578681
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,7168,512,0.0038968887594011095
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,7168,768,0.01420177850458357
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,7168,16384,0.04689155684577095
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,7168,256,0.0032666667054096856
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,7168,512,0.013472889032628802
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,7168,128,0.0033822223130199644
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,7168,64,0.003156444471743372
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,7168,256,0.012431110772821637
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,7168,128,0.011476444701353708
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,7168,32,0.0028604444944196274
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,7168,64,0.011384000380833944
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,7168,10240,0.03207022282812331
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,7168,32,0.011732444167137146
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,6144,65536,0.12563110722435847
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,6144,51200,0.10067822535832723
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,6144,16384,0.038823998636669584
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,6144,65536,0.1416355503929986
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,6144,12288,0.03234400020705329
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,6144,51200,0.11052622397740682
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,6144,16384,0.043042666382259794
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,6144,10240,0.028287112712860107
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,6144,8192,0.024660444921917383
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,6144,12288,0.035022222333484225
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,6144,7168,0.020562666985723708
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,6144,10240,0.030850665436850652
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,7168,2048,0.015187554889255099
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,6144,8192,0.027433777848879497
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,6144,5120,0.01573600040541755
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,6144,7168,0.02421333392461141
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,6144,4096,0.013004444539546967
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,6144,3584,0.011693333586057028
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,6144,6144,0.022427555587556627
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,6144,5120,0.020945777495702107
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,6144,3072,0.011391999820868174
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,6144,4096,0.01927199959754944
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,6144,2560,0.009335111412737105
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,6144,2048,0.008665777742862701
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,6144,3584,0.018581334087583754
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,6144,1536,0.007296000089910295
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,6144,3072,0.017669333351982962
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,6144,2560,0.016192000773217943
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,6144,1024,0.0061928890645504
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,6144,2048,0.014656888114081489
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,6144,768,0.004928888960017098
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,6144,512,0.004230222354332606
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,6144,1536,0.01625688870747884
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,6144,256,0.0034968890249729156
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,6144,128,0.0033866665843460294
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,6144,512,0.01309866706530253
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,6144,64,0.002971555623743269
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,6144,256,0.012093333734406365
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,6144,32,0.003107555624511507
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,6144,128,0.011376000112957425
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,7168,5120,0.021205332544114854
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,6144,64,0.012427555190192329
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,6144,32,0.01143555591503779
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,5120,65536,0.11755732695261638
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,5120,51200,0.0935786697599623
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,5120,16384,0.03386933273739285
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,6144,6144,0.017975999249352347
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,5120,65536,0.13806845082177058
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,5120,12288,0.02791644467247857
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,5120,10240,0.024646222591400146
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,5120,51200,0.10811022255155776
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,5120,16384,0.04221777783499824
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,5120,8192,0.021536888347731695
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,5120,12288,0.03371644351217482
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,5120,7168,0.01884622209601932
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,5120,10240,0.02896089024013943
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,5120,6144,0.01683022247420417
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,5120,8192,0.026326222552193537
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,5120,5120,0.01443822185198466
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,5120,7168,0.02405422263675266
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,5120,4096,0.01145066652033064
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,5120,6144,0.022356443934970435
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,5120,3584,0.01016622202263938
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,5120,3072,0.009305777649084726
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,5120,5120,0.020695999264717102
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,5120,4096,0.019273777802785236
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,5120,2560,0.009226666556464301
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,5120,3584,0.018554665976100497
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,5120,2048,0.008229333493444655
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,6144,1024,0.014440000057220459
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,5120,1536,0.006605333338181178
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,6144,768,0.014076444837782117
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,5120,1024,0.00544177782204416
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,5120,768,0.004875555634498596
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,5120,2048,0.014774221513006421
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,5120,512,0.0041964443193541635
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,5120,1024,0.014106666048367819
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,5120,768,0.01366133325629764
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,5120,256,0.0034942221310403612
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,5120,128,0.003165333428316646
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,5120,512,0.013080889152155982
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,5120,64,0.0028364445186323593
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,5120,256,0.012098666694429187
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,5120,128,0.011409777734014722
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,5120,64,0.0124195557501581
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,5120,32,0.011377777490350934
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,4096,65536,0.08872355355156793
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,4096,51200,0.07179111242294312
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,4096,65536,0.09747911161846584
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,4096,16384,0.03052799900372823
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,4096,51200,0.07682577768961589
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,4096,12288,0.02414488957987891
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,5120,3072,0.01681155628628201
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,4096,16384,0.03089155422316657
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,5120,2560,0.015480000111791821
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,4096,10240,0.02162666618824005
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,4096,8192,0.018738667170206707
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,4096,12288,0.025046222739749487
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,5120,1536,0.014800000521871777
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,4096,7168,0.0169804443915685
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,4096,10240,0.022864888111750286
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,4096,6144,0.01583377851380242
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,4096,5120,0.013967111706733704
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,4096,4096,0.01036888857682546
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,4096,6144,0.01863822175396813
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,4096,3584,0.009660444325870937
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,4096,5120,0.01720622181892395
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,4096,3072,0.008756444685988957
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,5120,32,0.0028906667398081887
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,4096,4096,0.016158221496476066
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,4096,2560,0.007643555601437886
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,4096,3584,0.015545777148670621
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,4096,2048,0.006490666833188798
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,4096,3072,0.014458666245142618
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,4096,1536,0.0052488889131281115
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,4096,2560,0.013769778112570444
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,4096,1024,0.004179555508825514
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,4096,768,0.0038515557017591265
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,4096,2048,0.013427555561065674
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,4096,512,0.0035128887328836652
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,4096,1536,0.014120888378885059
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,4096,1024,0.013421333498424955
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,4096,768,0.013072888884279462
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,4096,512,0.012463111016485425
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,4096,256,0.011765333513418833
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,4096,64,0.002817777709828483
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,4096,128,0.011713777979214987
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,4096,32,0.0031848889258172777
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,4096,64,0.011032000184059143
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,3584,65536,0.08500711123148601
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,4096,32,0.011415111521879831
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,4096,8192,0.020991999242040846
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,4096,7168,0.01963555481698778
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,3584,51200,0.06872710916731092
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,3584,16384,0.027149332894219294
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,3584,12288,0.021685333715544805
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,3584,65536,0.09421333339479233
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,3584,51200,0.07491644223531087
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,3584,10240,0.0188755558596717
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,3584,16384,0.030026667647891577
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,3584,8192,0.017308443784713745
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,3584,12288,0.024494222468800012
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,3584,10240,0.02198666665289137
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,3584,7168,0.015829333000712924
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,3584,8192,0.020595555504163105
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,3584,6144,0.014774221513006421
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,3584,5120,0.013302221894264221
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,3584,7168,0.019302222463819716
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,4096,256,0.0034959999223550162
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,3584,3584,0.010020444790522257
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,3584,6144,0.018242667118708294
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,3584,5120,0.017235555582576327
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,3584,3072,0.009322666459613377
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,4096,128,0.003149333306484752
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,3584,4096,0.015779554843902588
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,3584,3584,0.014779556128713818
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,3584,2048,0.006179555422729916
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,3584,1536,0.005203555441564984
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,3584,2560,0.014149333039919535
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,3584,1024,0.004277333203289243
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,3584,2048,0.013415111435784234
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,3584,768,0.004026666697528628
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,3584,1536,0.013824000126785703
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,3584,512,0.003559999995761447
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,3584,1024,0.013335111240545908
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,3584,256,0.0031911111954185697
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,3584,768,0.013087111214796701
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,3584,128,0.0031537777847713898
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,3584,512,0.01242844429281023
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,3584,64,0.0028115556471877625
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,3584,256,0.011769777370823754
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,3584,32,0.003019555575317807
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,3584,128,0.011416888899273343
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,3584,64,0.011128000087208219
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,3584,32,0.011750222080283694
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,3072,51200,0.06052177482181125
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,3072,65536,0.09244355228212144
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,3584,4096,0.011345778074529437
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,3072,16384,0.022298667165968154
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,3072,12288,0.018924444913864136
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,3072,51200,0.07273155450820923
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,3584,2560,0.007314666277832455
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,3072,10240,0.016559999850061204
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,3072,8192,0.014212444424629211
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,3072,12288,0.023686221904224817
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,3584,3072,0.014143110977278816
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,3072,7168,0.013769778112570444
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,3072,10240,0.021871111459202234
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,3072,6144,0.012424888710180918
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,3072,5120,0.01092977739042706
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,3072,8192,0.020253333780500624
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,3072,7168,0.018750222192870248
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,3072,6144,0.017843556072976854
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,3072,3584,0.008966222405433655
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,3072,5120,0.01646577815214793
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,3072,3072,0.008097777764002482
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,3072,4096,0.014789332946141561
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,3072,2560,0.0070222218831380205
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,3072,3584,0.01477688882086012
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,3072,2048,0.0063235556913746735
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,3072,3072,0.014099554883109199
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,3072,1536,0.005280888742870755
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,3072,2560,0.013742222554153867
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,3072,1024,0.0042462220622433555
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,3072,65536,0.0750088890393575
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,3072,2048,0.013382222089502545
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,3072,768,0.003911111089918348
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,3072,1536,0.01353422221210268
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,3072,512,0.003564444267087512
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,3072,1024,0.013069333301650153
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,3072,256,0.0035048888789282907
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,3072,128,0.0029395555870400537
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,3072,768,0.01274577776590983
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,3072,512,0.012426666915416718
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,3072,64,0.0028151110228565005
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,3072,32,0.0029519999192820657
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,3072,256,0.011717333561844297
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,3072,128,0.011419555379284753
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,3072,16384,0.028956443071365356
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,3072,64,0.01108266661564509
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,2560,65536,0.06442666716045804
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,3072,32,0.011369778050316704
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,2560,16384,0.019898666275872123
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,2560,12288,0.01625155574745602
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,2560,65536,0.0893591112560696
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,2560,10240,0.014884443746672736
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,2560,16384,0.027781334188249376
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,2560,51200,0.07045777638753255
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,2560,12288,0.023303111394246418
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,3072,4096,0.009335111412737105
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,2560,7168,0.012778666284349231
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,2560,6144,0.011681777735551199
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,2560,10240,0.02163822286658817
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,2560,5120,0.010013333625263637
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,2560,8192,0.019732443822754752
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,2560,4096,0.008976000050703684
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,2560,7168,0.018160000443458557
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,2560,3584,0.008634666601816813
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,2560,6144,0.01717688971095615
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,2560,3072,0.007965332931942409
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,2560,5120,0.016146666473812528
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,2560,2560,0.006656000183688269
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,2560,4096,0.014799111419253878
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,2560,2048,0.005919999960396025
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,2560,3584,0.014466666513019137
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,2560,1536,0.0052737775776121355
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,2560,3072,0.013768889009952545
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,2560,1024,0.004231111043029361
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,2560,2560,0.013788444300492605
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,2560,768,0.0038951109680864546
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,2560,512,0.003556444413132138
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,2560,2048,0.013119999733236102
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,2560,1536,0.013450666434235044
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,2560,256,0.0032106666929192017
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,2560,1024,0.012768000364303589
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,2560,128,0.0028239999794297745
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,2560,768,0.012721777790122561
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,2560,64,0.00286311118139161
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,2560,512,0.012056888805495368
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,2560,256,0.011728888584507836
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,2560,32,0.0028719999310043124
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,2560,128,0.011727111207114326
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,2048,65536,0.05256977677345276
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,2560,32,0.010739555789364709
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,2048,51200,0.04182755615976122
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,2048,16384,0.017650667164060805
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,2560,51200,0.04788088798522949
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,2048,65536,0.08641599946551853
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,2048,12288,0.01443377799457974
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,2048,51200,0.06885866986380683
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,2048,10240,0.013395555317401886
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,2048,16384,0.026723555392689172
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,2048,8192,0.011988444460762871
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,2048,12288,0.023382221659024555
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,2048,7168,0.011243555280897351
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,2048,10240,0.020971554848882887
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,2048,6144,0.012097777591811286
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,2048,5120,0.010593777729405297
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,2048,8192,0.01869155632125007
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,2048,7168,0.017875555488798354
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,2048,4096,0.01054044481780794
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,2048,3584,0.009033777647548253
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,2048,6144,0.016512889001104567
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,2048,3072,0.00927466650803884
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,2048,5120,0.015240000353919135
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,2048,2560,0.007613333563009898
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,2048,4096,0.0148026661740409
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,2048,3584,0.014456000592973499
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,2048,2048,0.006937777830494775
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,2048,1536,0.00591555568906996
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,2048,3072,0.013769778112570444
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,2048,1024,0.004917333523432414
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,2048,2048,0.013064000341627332
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,2048,768,0.003896000070704354
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,2048,1536,0.013232889274756113
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,2048,512,0.003531555748648114
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,2048,1024,0.012079999678664737
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,2048,256,0.0031991110493739447
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,2048,768,0.01239111108912362
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,2560,64,0.011077333655622272
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,2048,128,0.0031600000543726813
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,2048,512,0.012456888953844706
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,2048,64,0.002879111096262932
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,2048,256,0.011570666399266986
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,2048,32,0.002830222249031067
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,2048,128,0.011364444262451597
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,1536,65536,0.04026844435267978
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,2048,64,0.011732444167137146
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,1536,51200,0.03234666585922241
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,1536,16384,0.014856000741322836
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,2560,8192,0.013244444297419654
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,1536,12288,0.015803555647532146
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,1536,65536,0.08373422092861599
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,1536,51200,0.06648711363474528
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,1536,10240,0.013340444200568728
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,1536,16384,0.026354667213228013
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,1536,8192,0.012080888781282636
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,1536,12288,0.022809776994917128
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,1536,7168,0.011404444773991903
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,1536,10240,0.020774222082561918
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,1536,6144,0.010747555229398938
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,1536,8192,0.017521777086787753
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,1536,5120,0.00998044427898195
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,1536,7168,0.01720355616675483
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,1536,4096,0.008963555925422246
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,1536,3584,0.007264888948864407
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,1536,5120,0.01512888901763492
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,1536,4096,0.014781332678265043
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,1536,3072,0.006592888798978593
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,1536,2560,0.005951111101441913
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,1536,3584,0.014269333746698169
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,1536,2048,0.0052284445199701525
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,1536,3072,0.014114666316244336
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,1536,1536,0.005221333354711533
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,1536,2560,0.013415999710559845
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,1536,1024,0.0041946665280395085
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,1536,2048,0.013074666261672974
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,1536,768,0.0038488888078265717
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,1536,1536,0.013069333301650153
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,1536,512,0.0035146665241983202
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,1536,1024,0.012318222059143914
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,1536,256,0.0031662223239739737
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,2048,32,0.010716444088353051
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,1536,768,0.012390221986505719
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,1536,128,0.002985777747299936
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,1536,64,0.0028115556471877625
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,1536,512,0.012111110819710625
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,1536,32,0.002830222249031067
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,1536,256,0.011696889168686338
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,1536,128,0.01131199962562985
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,1024,65536,0.029442667961120605
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,1536,64,0.011008888483047485
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,1024,51200,0.024111110303137038
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,1536,32,0.011032000184059143
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,1024,16384,0.01272266689274046
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,1024,12288,0.013047999805874295
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,1024,51200,0.06276266442404853
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,1024,16384,0.02625600000222524
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,1536,6144,0.01621955633163452
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,1024,12288,0.021899556120236714
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,1024,8192,0.010375111467308467
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,2048,2560,0.013474666410022311
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,1024,7168,0.01148799972401725
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,1024,6144,0.0124177775449223
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,1024,10240,0.019588443968031142
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,1024,8192,0.017613333132531907
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,1024,5120,0.009681777821646797
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,1024,4096,0.009013333254390294
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,1024,6144,0.016152888536453247
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,1024,3584,0.007967111137178209
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,1024,5120,0.015285332997639975
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,1024,4096,0.014441778262456259
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,1024,3584,0.014472888575659858
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,1024,2560,0.005928888916969299
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,1024,3072,0.013770666387346057
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,1024,2048,0.007312888900438945
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,1024,2560,0.013800000150998434
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,1024,1536,0.005584888988071018
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,1024,2048,0.01295111080010732
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,1024,1024,0.004567999806669024
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,1024,1536,0.013103110922707452
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,1024,65536,0.0803555581304762
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,1024,768,0.003891555385457145
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,1024,1024,0.012104888757069906
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,1024,512,0.0035457776652442086
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,1024,256,0.0031999999450312722
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,1024,10240,0.011604444848166572
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,1024,768,0.012401777837011548
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,1024,128,0.0028391112056043413
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,1024,64,0.0028328889360030494
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,1024,256,0.011756444142924415
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,1024,32,0.003141333245568805
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,1024,128,0.011355555719799466
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,1024,7168,0.016840888394249808
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,768,65536,0.02401688860522376
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,1024,32,0.011439999772442712
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,768,51200,0.024197333388858374
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,768,16384,0.01204355557759603
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,1024,3072,0.006622222148709827
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,768,12288,0.010683555569913654
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,768,65536,0.07784710990058051
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,768,51200,0.06133244434992472
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,768,10240,0.010404444403118556
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,768,16384,0.025841777523358662
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,768,8192,0.012819555898507437
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,768,7168,0.011364444262451597
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,768,12288,0.021168000168270532
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,768,10240,0.019627556204795837
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,768,8192,0.01752088963985443
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,768,7168,0.016599110431141324
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,768,5120,0.00866844422287411
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,768,4096,0.007603555917739868
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,768,6144,0.016187555260128446
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,768,3584,0.006993778049945831
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,768,5120,0.015167999598715039
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,768,3072,0.00630044440428416
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,768,4096,0.014428445034556918
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,768,2560,0.005611555443869696
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,768,3584,0.014567111929257711
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,768,2048,0.0052355556852287715
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,768,3072,0.013762666947311826
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,1024,512,0.011765333513418833
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,768,1536,0.004543111142185
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,768,2560,0.013402666482660504
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,768,1024,0.0041999999019834726
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,768,2048,0.013103110922707452
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,768,768,0.003863111138343811
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,768,512,0.003157333367400699
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,768,1536,0.012741333080662621
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,1024,64,0.011439111497667102
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,768,1024,0.012120889292822944
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,768,256,0.0031804444475306403
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,768,128,0.0028320000403457214
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,768,768,0.0127688886390792
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,768,64,0.0028088889602157804
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,768,512,0.01204355557759603
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,768,32,0.0025475554996066624
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,768,256,0.011708444191349877
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,512,65536,0.022392888863881428
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,768,128,0.011086222198274402
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,768,64,0.011712888876597086
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,512,51200,0.018225777480337355
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,768,32,0.010694222317801582
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,512,16384,0.012274666792816587
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,512,12288,0.011018666956159802
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,512,65536,0.07529333564970228
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,512,10240,0.009551111194822524
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,512,51200,0.05958844555748833
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,768,6144,0.009351111120647853
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,512,12288,0.02130844526820713
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,512,7168,0.008017777568764156
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,512,6144,0.007834666305118138
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,512,10240,0.019813333948453266
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,512,8192,0.017266665895779926
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,512,5120,0.008307555483447181
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,512,7168,0.016910221841600206
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,512,4096,0.007594666547245449
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,512,6144,0.015810666812790763
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,512,5120,0.015113777584499784
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,512,3072,0.006279110908508301
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,512,4096,0.014633778068754407
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,512,2560,0.005586666779385672
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,512,3584,0.014157333307796054
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,512,2048,0.0053591111467944244
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,512,3072,0.013481777575280933
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,512,1536,0.004744889007674323
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,512,2560,0.013775111072593264
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,512,1024,0.003927999900446998
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,512,2048,0.01308444473478529
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,512,768,0.003670222229427762
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,512,1536,0.012552888856993781
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,512,512,0.003495111233658261
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,512,1024,0.012439111040698158
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,512,256,0.0031831111345026228
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,512,768,0.012383999923865
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,512,128,0.002817777709828483
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,512,512,0.011767110890812345
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,512,64,0.002814222127199173
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,512,256,0.011735999749766456
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,512,32,0.0028195555011431375
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,512,128,0.011407111254003314
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,512,8192,0.008618666893906063
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,256,65536,0.01824977828396691
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,512,64,0.011030221978823343
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,256,51200,0.015499555402331881
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,512,32,0.011740444435013665
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,256,16384,0.009879999690585667
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,256,12288,0.00999466660949919
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,256,65536,0.07203377617730035
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,256,51200,0.0584462218814426
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,256,10240,0.008987555901209513
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,256,16384,0.024696888195143804
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,256,8192,0.008296888735559251
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,512,3584,0.007055111229419708
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,256,12288,0.020970667401949566
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,256,7168,0.00795377790927887
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,256,10240,0.018890667292806838
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,256,8192,0.017649778061442904
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,256,5120,0.007996444072988298
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,256,7168,0.016325333052211337
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,256,6144,0.015531554818153381
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,256,3584,0.0069191112286514705
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,256,5120,0.01531377765867445
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,256,3072,0.006281777802440856
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,256,3584,0.014108444253603617
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,256,2560,0.005594666633341048
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,256,3072,0.013839999834696451
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,256,2048,0.004946666873163647
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,256,2560,0.013421333498424955
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,256,1536,0.004226666771703296
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,256,2048,0.01309866706530253
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,256,1024,0.0037235555549462638
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,512,16384,0.02462844385041131
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,256,768,0.003519111209445529
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,256,1024,0.012433778080675336
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,256,512,0.0031786666562159858
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,256,768,0.01239111108912362
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,256,256,0.002891555635465516
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,256,512,0.012075555821259817
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,256,128,0.002628444383541743
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,256,6144,0.008340444829728868
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,256,256,0.011371555427710215
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,256,64,0.002543111021320025
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,256,32,0.002806222273243798
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,256,4096,0.007611555357774098
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,256,128,0.011744000017642975
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,256,64,0.010685332947307162
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,128,65536,0.015233778291278414
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,128,51200,0.014783110883500842
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,256,32,0.011052444577217102
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,128,16384,0.009543110926946005
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,128,12288,0.009324444664849175
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,128,65536,0.0715528859032525
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,128,10240,0.00903555585278405
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,128,51200,0.05681600173314413
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,128,16384,0.024272888898849487
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,128,7168,0.009039999710188972
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,128,12288,0.020584889584117465
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,128,10240,0.01958577831586202
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,128,6144,0.008316444853941599
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,128,8192,0.01717333330048455
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,128,5120,0.007923555870850882
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,128,7168,0.016549333930015564
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,128,6144,0.015951111912727356
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,128,5120,0.014807111687130399
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,256,1536,0.012502222425407834
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,128,3584,0.0069439998931354946
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,128,3072,0.006303999986913469
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,128,4096,0.014486221803559197
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,128,2560,0.006231110956933763
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,128,2048,0.004925333377387789
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,128,3584,0.014076444837782117
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,128,3072,0.013797333670987023
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,128,1536,0.004530666602982415
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,128,2560,0.013468444347381592
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,128,1024,0.003907555507289039
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,128,768,0.003485333174467087
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,128,2048,0.012777778009573618
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,128,1536,0.012869333227475485
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,128,512,0.0037884443170494507
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,128,768,0.012112889024946423
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,128,256,0.003126222226354811
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,128,512,0.012113778127564324
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,128,128,0.0025155554629034465
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,256,4096,0.014119111829333834
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,128,64,0.002528000002106031
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,128,256,0.011376889215575324
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,128,32,0.0028275555620590844
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,128,128,0.011559999651379056
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,128,8192,0.00795199970404307
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,64,65536,0.016558221644825406
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,128,64,0.010406222608354356
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,64,51200,0.015480889214409722
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,128,32,0.010491555763615502
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,64,16384,0.009336888790130615
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,64,12288,0.008330666356616551
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,64,65536,0.06836711035834418
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,128,4096,0.007246221933099959
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,64,51200,0.05493333273463779
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,64,10240,0.007599111232492659
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,64,16384,0.023782221807373896
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,64,8192,0.00794933322403166
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,64,7168,0.007327111230956183
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,64,12288,0.02095111045572493
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,64,6144,0.006973333656787872
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,64,10240,0.01886488828394148
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,64,8192,0.017200888858901132
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,64,5120,0.0069226668112807805
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,64,4096,0.006285333385070165
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,64,7168,0.016357334123717416
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,64,3584,0.0059368887709246735
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,64,6144,0.016175111134847004
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,64,3072,0.005959110955397288
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,64,5120,0.0147724449634552
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,64,4096,0.014121777481502958
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,64,2560,0.006241777704821692
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,64,2048,0.005944889038801193
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,64,1536,0.0041866666740841335
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,64,3072,0.013801777528391944
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,128,1024,0.01238666640387641
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,64,1024,0.0035866668654812705
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,64,768,0.003552888830502828
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,64,1536,0.01239111108912362
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,64,512,0.003050666716363695
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,64,1024,0.01239822225438224
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,64,256,0.0028133332315418455
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,64,768,0.012539555629094442
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,64,128,0.002858666703104973
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,64,512,0.011716444459226398
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,64,64,0.002522666628162066
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,64,256,0.011508444117175208
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,64,32,0.0028159999185138275
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,64,128,0.011728888584507836
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,32,65536,0.016156444946924847
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,64,64,0.010348444183667501
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,32,51200,0.01517955627706316
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,64,32,0.010796444283591377
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,32,16384,0.009345778160625035
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,32,65536,0.06826221942901611
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,32,51200,0.05507377783457438
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,32,12288,0.008307555483447181
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,32,16384,0.02416177756256527
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,32,10240,0.007644444704055786
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,32,8192,0.00795022232664956
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,32,12288,0.0207004447778066
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,32,10240,0.019155555301242404
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,32,7168,0.007611555357774098
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,64,3584,0.013869333598348828
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,32,8192,0.01757244434621599
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,32,6144,0.0069395556218094295
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,32,5120,0.0069413334131240845
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,32,4096,0.006238222122192383
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,64,2048,0.012771555946932899
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,32,7168,0.01650044487582313
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,32,6144,0.015469332536061605
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,32,3584,0.006252444452709622
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,32,3072,0.005716444303592046
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,32,4096,0.014116444521480136
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,32,3584,0.014083556003040738
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,32,3072,0.013440888788965015
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,32,2048,0.0059057776298787855
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,32,1536,0.004530666602982415
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,32,2560,0.013078221844302284
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,32,1024,0.0038248888320393036
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,32,768,0.003552000141806073
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,32,2048,0.012739555703269111
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,32,1536,0.012744888663291931
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,32,512,0.003220444545149803
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,32,1024,0.012034667034943899
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,32,256,0.0028693332440323303
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,32,768,0.012160888976520963
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,32,128,0.0028311111446883944
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,32,64,0.0028284444577164124
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,32,512,0.011760888828171624
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,32,256,0.011161777708265515
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,32,32,0.002833777831660377
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,32,128,0.011415999796655444
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,32,64,0.011388444238238864
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,32,32,0.010198222266303169
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,64,2560,0.012826667063766055
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,65,32,5120,0.01536355581548479
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,65,32,2560,0.005952000204059813
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,65536,51200,0.5233884387546116
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,65536,16384,0.17917866177029082
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,65536,16384,0.3691555658976237
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,65536,12288,0.2704177697499593
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,65536,12288,0.13550489478641087
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,65536,51200,1.12880982293023
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,65536,10240,0.2280933327145047
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,65536,8192,0.18536978297763398
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,65536,10240,0.11568355560302734
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,65536,8192,0.09886755545934041
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,65536,7168,0.16107555230458578
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,65536,7168,0.0845057765642802
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,65536,6144,0.13904533121320936
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,65536,6144,0.07511644230948554
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,65536,10240,0.1860897805955675
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,65536,12288,0.22247023052639434
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,65536,5120,0.11843110455407037
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,65536,5120,0.06473066409428914
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,65536,16384,0.2914942105611165
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,65536,8192,0.15540711085001627
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,65536,7168,0.1391377713945177
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,65536,3584,0.08419733577304417
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,65536,4096,0.09473777479595608
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,65536,4096,0.05525955557823181
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,65536,6144,0.12331288390689427
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,65536,3072,0.07410222291946411
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,65536,4096,0.09311466746860081
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,65536,3072,0.0448657770951589
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,65536,2560,0.06302044126722547
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,65536,5120,0.1095306674639384
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,65536,2048,0.05236088898446825
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,65536,3584,0.08635555373297797
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,65536,2560,0.03997066617012024
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,65536,3072,0.07949066824383207
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,65536,1536,0.0407591097884708
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,65536,2048,0.035571555296579994
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,65536,2560,0.07022044393751356
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,65536,1536,0.030241777499516804
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,65536,1024,0.030048890246285334
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,65536,2048,0.06396622127956815
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,65536,768,0.02292888859907786
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,65536,1536,0.05578844414816963
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,65536,1024,0.024324445260895625
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,65536,512,0.015600000818570455
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,65536,1024,0.04863644308514065
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,65536,768,0.02072622213098738
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,65536,256,0.009331555830107795
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,65536,768,0.04317422376738655
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,65536,128,0.006871999965773688
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,65536,512,0.017519111434618633
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,65536,512,0.03775022096104092
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,65536,256,0.03297066688537598
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,65536,256,0.015822221835454304
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,65536,32,0.00490133340160052
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,65536,128,0.026776888304286536
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,65536,128,0.014131555954615274
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,65536,64,0.01483022173245748
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,65536,32,0.01889866590499878
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,51200,65536,0.553642643822564
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,51200,51200,0.8639733526441785
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,51200,65536,1.1087875366210938
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,65536,64,0.004658666749795278
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,65536,3584,0.050072001086341016
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,51200,51200,0.4254755443996853
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,51200,16384,0.282458676232232
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,51200,16384,0.14587467246585423
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,51200,12288,0.21127555105421278
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,51200,10240,0.1772995524936252
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,65536,51200,0.9256177478366427
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,51200,12288,0.11101866430706447
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,51200,8192,0.1438995599746704
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,51200,10240,0.09535377555423313
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,51200,8192,0.08211911386913724
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,51200,7168,0.1262471146053738
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,51200,7168,0.07083377573225233
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,51200,12288,0.1880426671769884
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,51200,6144,0.10595111052195232
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,51200,16384,0.24313333299424914
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,51200,5120,0.09222666422526042
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,51200,6144,0.06311644448174371
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,51200,8192,0.1347742213143243
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,51200,4096,0.07558933231565687
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,51200,5120,0.054937776592042714
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,51200,7168,0.1220746702618069
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,51200,10240,0.1623120043012831
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,51200,3584,0.06660888592402141
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,51200,4096,0.04727466570006477
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,51200,6144,0.1091724435488383
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,51200,3072,0.05821955866283841
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,51200,3584,0.0428088903427124
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,51200,5120,0.09518755806816949
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,51200,2560,0.04838133189413282
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,51200,4096,0.08295910888248019
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,51200,3072,0.03901422354910109
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,51200,2048,0.040397332774268255
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,51200,2560,0.034865776697794594
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,51200,3584,0.07629688580830891
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,51200,3072,0.06971644692950778
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,51200,2048,0.031288888719346784
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,51200,1536,0.03210044569439358
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,51200,2560,0.06321066617965698
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,51200,1024,0.023519999451107446
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,51200,2048,0.05629511011971367
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,51200,1536,0.026399999856948853
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,51200,768,0.017172444197866652
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,51200,1024,0.02055999967787001
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,51200,1536,0.051170667012532554
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,51200,1024,0.04383200075891283
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,51200,512,0.012083555261294046
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,51200,256,0.008002666963471307
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,51200,768,0.01829600003030565
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,51200,768,0.039108445247014366
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,51200,128,0.0052560000783867305
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,51200,512,0.01681422193845113
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,51200,512,0.03474222289191352
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,51200,256,0.03046400017208523
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,51200,64,0.004570666700601578
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,51200,32,0.004871110949251386
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,51200,128,0.02608355548646715
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,51200,64,0.014104000396198697
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,51200,32,0.0162426663769616
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,16384,65536,0.34942489200168186
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,16384,65536,0.21131466494666207
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,16384,51200,0.27499111493428546
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,16384,51200,0.16245955891079372
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,16384,16384,0.08251200119654338
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,51200,256,0.014268444644080268
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,16384,16384,0.061069336202409535
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,51200,128,0.01312622262371911
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,16384,12288,0.06445866823196411
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,16384,12288,0.04827466607093811
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,16384,10240,0.053448001543680825
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,51200,51200,0.7486222055223254
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,16384,16384,0.07817066378063627
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,16384,12288,0.06289511256747775
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,16384,10240,0.04216444492340088
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,16384,8192,0.04519288738568624
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,51200,65536,0.9592026604546441
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,16384,7168,0.03917600048912896
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,16384,8192,0.036920001109441124
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,16384,6144,0.034099555677837796
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,16384,10240,0.05762844615512424
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,16384,8192,0.05081689026620653
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,16384,6144,0.03013422091801961
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,16384,7168,0.036306666003333196
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,16384,7168,0.04758933186531067
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,16384,65536,0.2359466552734375
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,16384,4096,0.025459556115998164
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,16384,6144,0.045033779409196645
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,16384,51200,0.18461510870191786
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,16384,3584,0.02181333303451538
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,16384,5120,0.0418524444103241
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,16384,3072,0.019349333312776353
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,16384,4096,0.03641866644223531
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,16384,3584,0.036269333627488874
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,16384,3584,0.02259822189807892
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,16384,3072,0.020821332931518555
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,16384,3072,0.034272889296213783
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,16384,2048,0.013387555877367655
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,16384,2560,0.01925155520439148
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,16384,2560,0.03201866812176175
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,16384,1536,0.010659555594126383
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,16384,2048,0.017942221628295053
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,16384,2048,0.03133777777353922
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,16384,1024,0.009341333475377824
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,16384,1536,0.016913778252071805
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,16384,1536,0.029170665476057265
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,16384,768,0.007248889240953658
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,16384,1024,0.027744000156720478
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,16384,768,0.013593778014183044
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,16384,5120,0.029496888319651287
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,16384,512,0.006214222146405115
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,16384,768,0.02535111043188307
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,16384,256,0.00388711111413108
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,16384,512,0.0224906669722663
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,16384,512,0.01239466667175293
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,16384,5120,0.02740977704524994
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,16384,128,0.0036151111125946045
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,16384,256,0.012053333222866058
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,16384,256,0.020969778299331665
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,16384,64,0.0031662223239739737
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,16384,4096,0.024822221861945257
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,16384,32,0.0035137778355015647
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,16384,128,0.011728888584507836
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,16384,128,0.018522666560279
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,16384,64,0.011707555916574268
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,16384,32,0.012375999655988483
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,16384,2560,0.016114667057991028
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,12288,65536,0.24858665466308594
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,12288,65536,0.1879040002822876
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,12288,51200,0.19625422689649794
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,12288,16384,0.06695289081997342
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,12288,51200,0.1450079944398668
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,12288,12288,0.053540445036358304
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,12288,16384,0.054084443383746676
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,12288,12288,0.04305155409706963
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,16384,1024,0.015111999379263984
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,12288,10240,0.04386666748258802
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,12288,12288,0.056187556849585645
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,12288,16384,0.06883377499050565
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,12288,10240,0.038211554288864136
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,12288,8192,0.03685599896642897
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,12288,7168,0.032315555546018816
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,12288,10240,0.051170667012532554
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,12288,8192,0.03416266706254747
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,12288,6144,0.02791022260983785
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,12288,8192,0.0481608874268002
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,12288,7168,0.03056710958480835
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,12288,5120,0.024490666058328416
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,12288,7168,0.043419556485282056
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,12288,6144,0.027987556325064764
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,12288,4096,0.020661332541041903
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,12288,5120,0.025072889195548162
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,12288,5120,0.03756266501214769
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,12288,3584,0.01792533364560869
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,12288,4096,0.021627555290857952
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,12288,4096,0.034847110509872437
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,12288,3584,0.02057422200838725
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,12288,3584,0.03393244412210252
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,12288,2560,0.013576000101036496
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,12288,3072,0.019542222221692402
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,12288,3072,0.0326204432381524
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,12288,2048,0.011585777832402123
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,12288,2560,0.018552889426549275
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,12288,2560,0.031143999762005273
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,12288,1536,0.009424000150627559
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,12288,2048,0.017504000001483493
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,12288,2048,0.02954933378431532
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,12288,1024,0.007708444363541073
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,12288,1536,0.01590755581855774
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,12288,1536,0.028471999698215063
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,12288,768,0.006550222221348021
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,12288,1024,0.02583911187118954
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,12288,6144,0.041469332244661115
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,12288,768,0.013078221844302284
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,12288,768,0.02342844506104787
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,12288,65536,0.1975253290600247
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,12288,512,0.004885333279768626
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,12288,512,0.021595555875036452
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,12288,256,0.0037760001917680106
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,12288,512,0.01238222254647149
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,12288,128,0.003495111233658261
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,12288,256,0.01205244412024816
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,12288,256,0.020284444093704224
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,12288,64,0.00350577798154619
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,12288,128,0.011718221836619906
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,12288,32,0.003491555651028951
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,12288,64,0.011406222151385413
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,12288,32,0.011724444727102915
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,10240,65536,0.22192977534400093
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,10240,65536,0.1772915522257487
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,10240,51200,0.17448088857862684
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,12288,1024,0.013768889009952545
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,10240,51200,0.1371955606672499
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,10240,16384,0.05394133263164096
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,12288,51200,0.15886221991644964
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,10240,12288,0.04279555545912849
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,10240,16384,0.052079998784595065
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,10240,12288,0.04177511069509718
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,12288,3072,0.01588444411754608
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,10240,16384,0.0654968884256151
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,10240,10240,0.03492710987726847
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,12288,128,0.018538667096032035
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,10240,8192,0.02984444300333659
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,10240,12288,0.054216000768873424
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,10240,10240,0.037068443165885076
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,10240,7168,0.025828444295459326
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,10240,8192,0.03269155489073859
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,10240,10240,0.04998488889800178
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,10240,6144,0.0229404436217414
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,10240,65536,0.18659644656711152
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,10240,8192,0.04536622100406223
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,10240,7168,0.029393778906928167
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,10240,51200,0.1503804392284817
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,10240,5120,0.019816888703240287
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,10240,7168,0.042488889561759106
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,10240,6144,0.026657778355810378
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,10240,6144,0.03952444593111674
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,10240,3584,0.014631110760900708
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,10240,5120,0.023657777243190344
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,10240,5120,0.037392887804243304
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,10240,4096,0.02200088898340861
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,10240,3072,0.013120888835854001
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,10240,4096,0.03425777620739407
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,10240,2560,0.011386666860845355
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,10240,3584,0.020177778270509508
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,10240,3072,0.019273777802785236
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,10240,3072,0.03257955445183648
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,10240,2048,0.009955555200576782
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,10240,2560,0.03187111020088196
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,10240,2560,0.018180444836616516
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,10240,1536,0.008225777910815345
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,10240,1024,0.006888888776302338
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,10240,2048,0.02924799919128418
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,10240,2048,0.01718755563100179
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,10240,1536,0.02808088726467556
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,10240,1536,0.015800888339678448
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,10240,768,0.005251555393139522
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,10240,1024,0.013061333033773633
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,10240,1024,0.02466933263672723
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,10240,512,0.004181333300140169
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,10240,768,0.0232924438185162
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,10240,768,0.012832000023788877
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,10240,256,0.0038906666967603895
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,10240,512,0.012330667012267642
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,10240,512,0.021951110826598272
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,10240,128,0.003519111209445529
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,10240,256,0.02023555503951179
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,10240,256,0.012056888805495368
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,10240,64,0.0032026666320032547
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,10240,128,0.011364444262451597
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,10240,32,0.0034799998005231223
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,10240,64,0.01221155540810691
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,10240,32,0.011352889239788055
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,8192,65536,0.18196622530619302
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,10240,4096,0.017498667041460674
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,8192,65536,0.12843110826280382
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,8192,51200,0.14388533433278403
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,10240,3584,0.03412355648146735
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,8192,51200,0.09953155782487656
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,8192,16384,0.05012089014053345
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,8192,16384,0.040390223264694214
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,8192,12288,0.033477332856920027
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,8192,12288,0.03310488992267185
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,8192,16384,0.06357777780956693
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,8192,10240,0.028414222929212783
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,8192,12288,0.0536062220732371
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,8192,8192,0.02418311105834113
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,8192,10240,0.029456890291637842
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,10240,128,0.018894222047593858
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,8192,10240,0.04929866724544101
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,8192,8192,0.025634666283925373
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,8192,65536,0.18194933732350668
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,8192,7168,0.021432888176706102
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,8192,51200,0.14710577328999838
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,8192,6144,0.018552000323931377
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,8192,8192,0.044529779089821704
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,8192,5120,0.016187555260128446
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,8192,7168,0.023388443721665278
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,8192,4096,0.013756444056828817
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,8192,7168,0.041344000233544245
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,8192,6144,0.039769778649012245
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,8192,3584,0.013160000244776407
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,8192,5120,0.03723377651638455
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,8192,5120,0.01953155630164676
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,8192,4096,0.03424266642994351
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,8192,3072,0.011734222372372946
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,8192,4096,0.018238221605618794
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,8192,2560,0.010575110713640848
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,8192,3584,0.032462222708596125
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,8192,3072,0.01681600014368693
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,8192,2048,0.008948444492287105
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,8192,3072,0.031376888354619346
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,8192,2560,0.03086577852567037
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,8192,1536,0.007683555285135905
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,8192,2048,0.02956355611483256
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,8192,2048,0.014878221684032016
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,8192,1024,0.006555555595291986
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,8192,1536,0.0270462218258116
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,8192,1536,0.013447999954223633
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,8192,768,0.0045422220395671
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,8192,1024,0.024847999215126038
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,8192,1024,0.012443555725945367
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,8192,512,0.003847111016511917
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,8192,768,0.023704888092146978
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,8192,256,0.0035084444615576
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,8192,512,0.01205599970287747
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,8192,512,0.02158311174975501
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,8192,128,0.0034968890249729156
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,8192,256,0.011537777880827585
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,8192,256,0.020578665865792167
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,8192,64,0.0032071111102898917
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,8192,128,0.011180444724029966
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,8192,128,0.018185777796639335
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,8192,32,0.0034959999223550162
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,8192,6144,0.02126666737927331
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,8192,32,0.011374221907721626
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,7168,65536,0.15352977646721735
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,8192,3584,0.017863111363516915
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,7168,51200,0.12524178293016222
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,8192,2560,0.016150222884284127
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,7168,16384,0.04612177941534254
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,7168,51200,0.09306133455700344
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,7168,16384,0.03826933436923557
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,8192,768,0.012425777812798819
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,7168,12288,0.03565866748491923
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,7168,16384,0.06326399909125434
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,7168,10240,0.027098667290475633
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,7168,65536,0.18035111162397596
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,7168,51200,0.14590133561028376
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,7168,10240,0.027795556518766616
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,7168,8192,0.02277244461907281
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,8192,64,0.011448000040319232
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,7168,10240,0.04857777886920505
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,7168,7168,0.020107555720541213
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,7168,8192,0.02422133253680335
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,7168,8192,0.04345600141419304
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,7168,6144,0.01763288842307197
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,7168,65536,0.12061066097683376
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,7168,7168,0.0417484442392985
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,7168,5120,0.015138667490747241
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,7168,6144,0.02015644477473365
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,7168,6144,0.039228445953793
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,7168,4096,0.013091555900043912
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,7168,5120,0.01923466722170512
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,7168,5120,0.03603377938270569
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,7168,3584,0.011330666641394297
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,7168,4096,0.017855111095640395
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,7168,4096,0.03454755412207709
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,7168,3072,0.011039111349317761
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,7168,3584,0.01733688844574822
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,7168,3584,0.033203555477990046
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,7168,12288,0.031298667192459106
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,7168,2560,0.009682666924264696
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,7168,3072,0.016723554995324876
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,7168,3072,0.03090933296415541
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,7168,12288,0.053525331947538585
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,7168,2048,0.008936888641781276
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,7168,1536,0.0075635554061995606
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,7168,2560,0.029911110798517864
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,7168,2560,0.015788444214397006
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,7168,2048,0.029727111260096233
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,7168,1024,0.005256888767083486
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,7168,2048,0.01480977733929952
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,7168,768,0.004559999952713649
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,7168,1536,0.013440888788965015
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,7168,1024,0.024686222275098164
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,7168,1024,0.012711111042234631
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,7168,512,0.0038648889296584656
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,7168,768,0.02420444455411699
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,7168,7168,0.021538666552967493
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,7168,512,0.023366222778956097
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,7168,256,0.011716444459226398
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,7168,256,0.021739555729760066
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,7168,128,0.0032106666929192017
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,7168,64,0.0031786666562159858
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,7168,128,0.018207111292415194
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,7168,128,0.011703111231327057
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,7168,32,0.003216000066863166
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,7168,64,0.011077333655622272
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,6144,65536,0.12508355246649847
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,7168,32,0.011701333026091257
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,6144,51200,0.0999528898133172
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,6144,65536,0.1118675602806939
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,7168,1536,0.025590222742822435
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,6144,51200,0.08615466621186997
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,6144,16384,0.03912711143493652
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,7168,768,0.012117333710193634
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,6144,16384,0.036708444356918335
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,6144,12288,0.032101333141326904
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,7168,512,0.012048888537618848
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,6144,10240,0.02847111225128174
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,6144,16384,0.06270844406551786
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,6144,12288,0.029079112741682265
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,6144,65536,0.17970666620466444
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,6144,51200,0.14483377668592665
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,6144,12288,0.05247377687030368
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,6144,8192,0.020385776956876118
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,6144,10240,0.025754666990704004
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,6144,7168,0.021872889664438035
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,6144,10240,0.048278222481409706
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,6144,8192,0.0225582222143809
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,6144,8192,0.04343377881579929
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,6144,7168,0.02069422271516588
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,6144,5120,0.016185777054892648
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,6144,7168,0.041167110204696655
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,6144,6144,0.019536000159051683
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,6144,6144,0.038620445463392473
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,6144,5120,0.0361422234111362
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,6144,5120,0.018351111147138808
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,6144,4096,0.03353066576851739
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,6144,4096,0.017151110702090792
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,6144,3072,0.009645333720578088
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,6144,3584,0.01681866745154063
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,6144,3072,0.01612444387541877
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,6144,3072,0.03185155656602647
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,6144,2560,0.008647999829716152
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,7168,256,0.003528888854715559
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,6144,2560,0.02977333466211955
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,6144,2560,0.01579466627703773
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,6144,2048,0.007453333172533248
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,6144,1536,0.006715555571847492
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,6144,2048,0.026737777723206416
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,6144,2048,0.013983110586802164
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,6144,1024,0.004855999930037392
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,6144,1536,0.01312888910373052
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,6144,1536,0.026036444637510512
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,6144,768,0.0041751112374994485
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,6144,6144,0.01942488882276747
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,6144,1024,0.01238044434123569
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,6144,1024,0.02509511179394192
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,6144,512,0.0035182221068276297
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,6144,768,0.023010666171709698
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,6144,768,0.012092444631788464
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,6144,4096,0.014741332994567024
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,6144,256,0.0034906665484110513
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,6144,512,0.01218311074707243
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,6144,128,0.0032115555885765287
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,6144,3584,0.012667555775907306
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,6144,256,0.011767110890812345
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,6144,256,0.020043555233213637
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,6144,64,0.002895111011134254
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,6144,128,0.011746666497654386
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,6144,128,0.01865688959757487
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,6144,3584,0.03195910983615451
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,6144,64,0.011081777513027191
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,6144,32,0.011759111450778114
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,5120,65536,0.11582577228546143
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,5120,65536,0.1023626658651564
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,5120,51200,0.09260800149705674
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,5120,16384,0.03356800145573086
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,5120,51200,0.07965955469343397
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,5120,16384,0.034041778908835515
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,5120,12288,0.029838220940695867
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,5120,16384,0.06229777468575371
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,5120,65536,0.17778310510847303
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,5120,10240,0.0247662216424942
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,5120,51200,0.14471377266777888
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,5120,12288,0.02718933257791731
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,6144,512,0.022338666849666174
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,5120,12288,0.052357332573996655
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,5120,8192,0.020808888806237113
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,5120,7168,0.01888444523016612
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,5120,10240,0.02379911144574483
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,5120,10240,0.047747555706236094
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,5120,8192,0.022164444128672283
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,5120,8192,0.04271289043956333
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,5120,6144,0.014484445254007975
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,6144,32,0.003097777772280905
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,5120,5120,0.012871999707486896
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,5120,7168,0.020246222615242004
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,5120,4096,0.011324444578753578
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,5120,6144,0.019144889381196763
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,5120,5120,0.01818933255142636
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,5120,5120,0.03602044449912177
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,5120,3584,0.009916444619496664
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,5120,4096,0.03264355659484863
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,5120,3072,0.009001777403884465
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,5120,3584,0.03319733341534933
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,5120,3072,0.015503999259736804
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,5120,3072,0.03182044294145372
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,5120,2560,0.008059555457697975
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,5120,2560,0.01407999959256914
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,5120,2560,0.029356443219714697
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,5120,2048,0.007255111303594377
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,5120,1536,0.005930666708283954
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,5120,2048,0.01369866645998425
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,5120,2048,0.02576622201336755
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,5120,1024,0.004249777644872665
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,5120,1536,0.012903110848532783
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,5120,1536,0.025200888514518738
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,5120,768,0.0041999999019834726
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,5120,1024,0.02460533380508423
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,5120,7168,0.04040266738997565
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,5120,768,0.023364444573720295
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,5120,512,0.0038408889538711975
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,5120,512,0.02130399975511763
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,5120,512,0.012028444144460889
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,5120,4096,0.016876444220542908
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,5120,3584,0.015832889411184523
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,5120,128,0.0032337777730491427
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,5120,256,0.011755555868148804
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,5120,256,0.021309332715140447
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,5120,64,0.003185777821474605
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,5120,128,0.020104888412687514
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,5120,128,0.011365333365069495
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,5120,32,0.003165333428316646
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,5120,64,0.011752000285519494
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,4096,65536,0.08734933535257976
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,5120,32,0.011207111179828644
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,4096,51200,0.07260977559619479
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,4096,65536,0.09401777717802261
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,5120,1024,0.012129777835475074
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,4096,51200,0.07602133353551228
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,4096,16384,0.028491556644439697
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,5120,768,0.012042666474978128
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,5120,6144,0.03847555650605096
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,4096,12288,0.023357333408461675
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,4096,16384,0.030577778816223145
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,4096,65536,0.17831022209591338
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,4096,10240,0.01868888901339637
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,4096,16384,0.06156177653206719
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,5120,256,0.0032097777972618737
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,4096,12288,0.02537600033813053
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,4096,8192,0.015989333391189575
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,4096,12288,0.05220266514354282
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,4096,7168,0.014411555396185981
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,4096,10240,0.04709955718782213
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,4096,10240,0.022740445203251306
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,4096,6144,0.012728888955381183
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,4096,8192,0.020845333735148113
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,4096,8192,0.04230133361286587
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,4096,5120,0.011108444796668159
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,4096,7168,0.04032622112168206
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,4096,4096,0.010206222534179688
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,4096,6144,0.01847999956872728
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,4096,6144,0.0379342238108317
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,4096,5120,0.01720266706413693
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,4096,5120,0.03580977850490146
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,4096,3584,0.009012444151772393
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,4096,4096,0.032856888241238065
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,4096,4096,0.016148444679048326
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,4096,3072,0.008383110993438298
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,4096,3584,0.014614222778214348
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,4096,3584,0.03230311142073737
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,4096,2560,0.007532444265153673
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,4096,3072,0.01422044469250573
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,4096,2048,0.006280000011126201
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,4096,2560,0.013593778014183044
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,4096,2048,0.013094222380055321
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,4096,2048,0.026322666141721938
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,4096,1536,0.004920888692140579
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,4096,1536,0.025363556212849084
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,4096,1536,0.012711111042234631
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,4096,1024,0.00416088890698221
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,4096,51200,0.1447297732035319
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,4096,768,0.00388355553150177
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,4096,1024,0.024339555038346186
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,4096,1024,0.012095111111799875
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,4096,512,0.0034933334423436057
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,4096,768,0.023638221952650283
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,4096,768,0.012416000167528788
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,4096,7168,0.019261333677503798
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,4096,256,0.003173333282272021
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,4096,512,0.012044444680213928
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,4096,128,0.0028613333900769553
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,4096,512,0.023007111416922674
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,4096,256,0.021290666527218286
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,4096,64,0.0028479999552170434
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,4096,128,0.0195795562532213
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,4096,128,0.011347555451922946
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,4096,32,0.002833777831660377
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,4096,64,0.011733333269755045
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,4096,3072,0.030471109681659277
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,3584,65536,0.07685777876112196
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,4096,32,0.011019555230935415
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,4096,2560,0.02808533443344964
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,3584,51200,0.06253333224190606
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,3584,16384,0.025803556044896443
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,3584,65536,0.09295111232333714
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,3584,51200,0.07425600290298462
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,3584,12288,0.02051111062367757
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,3584,16384,0.029750221305423315
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,3584,16384,0.06198844644758436
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,3584,12288,0.02397955622937944
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,3584,51200,0.14386933379703098
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,3584,12288,0.05202577842606438
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,3584,8192,0.015509333875444202
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,3584,10240,0.022008889251285132
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,3584,10240,0.046725332736968994
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,3584,7168,0.013620444469981723
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,3584,8192,0.02046133412255181
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,3584,8192,0.04200622108247545
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,3584,6144,0.01221866657336553
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,4096,256,0.011728888584507836
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,3584,7168,0.01891288823551602
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,3584,7168,0.040758222341537476
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,3584,5120,0.010640000303586325
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,3584,6144,0.01793955597612593
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,3584,6144,0.03773599863052368
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,3584,4096,0.009923555784755284
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,3584,5120,0.01717333330048455
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,3584,5120,0.03565333286921183
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,3584,3584,0.008749333520730337
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,3584,4096,0.015512888630231222
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,3584,4096,0.03245333168241713
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,3584,3072,0.008101333346631791
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,3584,3584,0.01478488908873664
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,3584,2560,0.007599111232492659
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,3584,3072,0.013813333378897773
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,3584,3072,0.030086222622129653
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,3584,2048,0.0058906666106647914
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,3584,2560,0.027816888358857896
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,3584,2560,0.013400000002649097
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,3584,1536,0.004854222138722737
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,3584,2048,0.02572000026702881
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,3584,10240,0.01790577835506863
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,3584,1024,0.003891555385457145
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,3584,65536,0.17796622382269967
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,3584,1536,0.025750221477614507
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,3584,768,0.003842666745185852
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,3584,1024,0.0239991115199195
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,3584,1024,0.012475555141766867
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,3584,512,0.0035013332962989807
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,3584,768,0.012107555237081317
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,3584,256,0.0031644445326593188
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,3584,512,0.02199466692076789
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,3584,512,0.012135110795497894
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,3584,128,0.003007111036115222
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,3584,256,0.011705777711338468
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,3584,256,0.02069511181778378
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,3584,64,0.0028844444702068963
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,3584,128,0.011772444678677453
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,3584,128,0.0191928893327713
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,3584,32,0.0028577778074476454
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,3584,64,0.010751999914646149
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,3584,32,0.011368888947698804
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,3072,65536,0.06758755445480347
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,3584,3584,0.031110223796632554
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,3072,51200,0.055267555846108325
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,3072,65536,0.0899626678890652
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,3584,2048,0.01278222186697854
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,3072,51200,0.07238044341405232
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,3072,16384,0.022054221895005967
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,3584,1536,0.012438221938080259
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,3072,12288,0.018607111440764535
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,3072,65536,0.17734311686621773
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,3072,16384,0.028896000650193956
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,3072,16384,0.061512887477874756
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,3072,10240,0.01590844492117564
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,3072,51200,0.14374755488501653
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,3072,12288,0.023649776975313824
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,3072,12288,0.05134133497873942
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,3072,8192,0.014153778553009033
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,3072,10240,0.04727111260096232
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,3072,10240,0.02166755497455597
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,3072,8192,0.019606222709019978
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,3072,6144,0.012770666844315
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,3072,7168,0.04047466648949517
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,3072,7168,0.0188755558596717
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,3072,5120,0.01033333357837465
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,3072,6144,0.017595556047227647
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,3072,5120,0.016511999898486666
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,3072,4096,0.009429333110650381
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,3072,5120,0.03479911221398248
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,3072,4096,0.015106666419241162
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,3072,3584,0.008339555727110969
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,3072,3584,0.014118222726715935
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,3584,768,0.023082666926913794
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,3072,3072,0.007744889292452071
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,3072,7168,0.013050666285885705
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,3072,3072,0.013803555733627744
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,3072,8192,0.04194577866130405
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,3072,2560,0.006888888776302338
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,3072,3072,0.029094222519132826
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,3072,2048,0.005879111174080107
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,3072,2560,0.02713866697417365
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,3072,2560,0.01308444473478529
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,3072,1536,0.005097777893145879
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,3072,2048,0.013055110971132914
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,3072,2048,0.02644088864326477
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,3072,1024,0.004211555752489301
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,3072,1536,0.01255555533700519
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,3072,1536,0.024688000480333965
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,3072,768,0.003830222205983268
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,3072,1024,0.024339555038346186
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,3072,1024,0.012118221984969245
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,3072,512,0.0035422220826148987
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,3072,4096,0.03291555576854282
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,3072,768,0.012049777640236748
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,3072,768,0.023014222582181294
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,3072,256,0.0035048888789282907
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,3072,128,0.002874666617976295
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,3072,256,0.020640000700950623
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,3072,256,0.011706666813956367
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,3072,64,0.0028355556229750314
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,3072,128,0.01110755569405026
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,3072,128,0.018529777725537617
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,3072,32,0.00286666676402092
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,3072,3584,0.03144888745413886
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,2560,65536,0.05888711081610786
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,3072,64,0.011074666347768573
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,3072,32,0.010992888775136737
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,2560,51200,0.04663199848598904
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,2560,65536,0.08894222312503391
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,2560,16384,0.01997422178586324
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,2560,51200,0.06920444303088717
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,2560,16384,0.027870221270455256
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,3072,6144,0.03754311137729221
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,2560,65536,0.17728711499108207
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,2560,51200,0.14346222082773843
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,2560,16384,0.06127555502785576
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,2560,12288,0.016756445169448853
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,2560,10240,0.014826666977670459
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,2560,8192,0.013111111190583972
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,2560,12288,0.023023999399609033
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,2560,10240,0.021176889538764954
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,2560,10240,0.04719733198483785
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,2560,7168,0.012368888490729861
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,2560,8192,0.019550222489568923
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,2560,8192,0.042131556404961475
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,2560,6144,0.011447110937701331
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,3072,512,0.022713777091768052
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,3072,512,0.011830222275522021
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,2560,7168,0.0184906671444575
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,2560,7168,0.03987377882003784
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,2560,4096,0.008833777573373582
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,2560,5120,0.010668444136778513
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,2560,6144,0.017501332693629794
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,2560,3584,0.008076444268226624
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,2560,5120,0.03571733170085483
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,2560,5120,0.015797333584891427
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,2560,4096,0.03211822112401327
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,2560,3072,0.007688889073001013
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,2560,4096,0.01477866702609592
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,2560,3584,0.030495110485288832
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,2560,3584,0.013814222481515674
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,2560,2560,0.00658044425977601
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,2560,3072,0.028090665737787884
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,2560,3072,0.013756444056828817
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,2560,2048,0.005281777845488654
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,2560,2560,0.013345777988433838
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,2560,1536,0.004866666677925321
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,2560,2048,0.026216889421145122
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,2560,2048,0.013065777719020844
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,2560,1024,0.0041804446114434134
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,2560,1536,0.02537600033813053
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,2560,1536,0.012726222475369772
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,2560,768,0.0038622220357259116
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,2560,1024,0.012432888978057437
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,2560,1024,0.02400622268517812
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,2560,512,0.00350577798154619
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,2560,12288,0.05117244521776835
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,2560,768,0.0120666664507654
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,2560,256,0.003162666741344664
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,2560,512,0.02157955533928341
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,2560,512,0.01182577759027481
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,2560,128,0.0031582222630580268
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,2560,256,0.011704888608720569
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,2560,256,0.019944889677895438
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,2560,64,0.002921777880854077
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,2560,6144,0.037744889656702675
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,2560,128,0.011367999845080905
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,2560,128,0.018594667315483093
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,2560,32,0.0028293333533737394
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,2048,65536,0.04895200000868904
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,2560,64,0.011039999624093374
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,2560,32,0.010716444088353051
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,2048,51200,0.039672000540627375
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,2048,65536,0.08580355511771308
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,2048,16384,0.018574222922325134
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,2560,2560,0.02753688891728719
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,2048,51200,0.06660799847708808
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,2048,12288,0.015375999940766228
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,2048,16384,0.02667466633849674
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,2048,65536,0.17821066909366182
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,2048,16384,0.06129599942101372
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,2048,10240,0.013762666947311826
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,2048,12288,0.023014222582181294
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,2048,12288,0.051085333029429116
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,2048,8192,0.012608889076444836
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,2048,10240,0.020849777592553034
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,2048,10240,0.04677955640686882
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,2048,7168,0.011633777783976661
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,2560,768,0.02364088926050398
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,2048,8192,0.018534221582942538
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,2048,6144,0.010994666980372535
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,2048,7168,0.01720977822939555
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,2048,7168,0.040243556102116905
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,2048,5120,0.01015644437736935
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,2048,6144,0.036284443404939436
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,2048,6144,0.016545777519543965
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,2048,4096,0.008953777452309927
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,2048,5120,0.01586844523747762
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,2048,5120,0.03390489021937052
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,2048,3584,0.007639110916190677
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,2048,4096,0.014456000592973499
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,2048,4096,0.03120888935195075
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,2048,3072,0.0068986668354935115
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,2048,3584,0.013920888304710388
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,2048,3584,0.03048000070783827
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,2048,2560,0.005896889087226655
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,2048,3072,0.013779555757840475
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,2048,3072,0.02877955635388692
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,2048,2048,0.0053093334039052325
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,2048,2560,0.02677244444688161
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,2048,2560,0.013439999686347114
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,2048,1536,0.004862222406599256
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,2048,2048,0.026123555170165166
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,2048,1024,0.004190222256713443
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,2048,1536,0.01275644451379776
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,2048,51200,0.14385422070821127
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,2048,768,0.003843555433882607
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,2048,1024,0.012422222230169507
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,2048,1024,0.024331554770469666
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,2048,512,0.00349866681628757
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,2048,768,0.02330844435426924
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,2048,768,0.012070222033394707
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,2048,256,0.003170666595300039
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,2048,8192,0.04198222359021505
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,2048,512,0.012071111136012606
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,2048,128,0.002862222285734283
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,2048,512,0.022755554980701868
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,2048,256,0.019949333535300363
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,2048,256,0.011380444798204633
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,2048,64,0.0028400001012616684
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,2048,128,0.01923022170861562
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,2048,32,0.0028719999310043124
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,1536,65536,0.03832533293300205
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,2048,64,0.011017777853541903
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,2048,32,0.011368888947698804
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,1536,51200,0.03018666638268365
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,1536,65536,0.08271200127071805
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,1536,16384,0.015321777926550971
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,1536,51200,0.06498399708006117
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,2048,2048,0.01279022213485506
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,2048,1536,0.024728000164031982
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,1536,51200,0.1442471080356174
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,1536,16384,0.026610665851169165
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,1536,12288,0.013752889302041797
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,1536,16384,0.060489780373043485
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,1536,10240,0.012084444363911947
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,1536,12288,0.022434666752815247
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,1536,12288,0.05141777793566386
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,1536,8192,0.011035555766688453
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,1536,10240,0.020522667302025687
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,1536,10240,0.04634488953484429
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,1536,7168,0.010499555203649731
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,1536,8192,0.018237334158685472
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,1536,8192,0.04050666756100125
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,1536,6144,0.009677333136399588
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,1536,7168,0.017501332693629794
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,1536,7168,0.0377493335141076
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,1536,5120,0.009310222334331935
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,2048,128,0.011710222396585675
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,1536,6144,0.03608533408906724
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,1536,4096,0.008665777742862701
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,1536,5120,0.033210668298933245
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,1536,5120,0.01512977812025282
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,1536,3584,0.00790666706032223
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,1536,4096,0.030193779203626845
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,1536,3072,0.006600889066855113
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,1536,3584,0.013751111096805997
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,1536,3584,0.029814223448435467
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,1536,2560,0.00590844452381134
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,1536,3072,0.028856890069113836
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,1536,3072,0.013835555149449242
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,1536,65536,0.17758311165703666
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,1536,2048,0.005375111268626318
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,1536,2560,0.013139555851618448
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,1536,1536,0.004862222406599256
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,1536,2560,0.02638133366902669
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,1536,2048,0.025939555631743536
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,1536,2048,0.012757333616415659
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,1536,1024,0.0038577777643998465
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,1536,1536,0.024525332782003615
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,1536,768,0.0038355555799272326
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,1536,1024,0.0243493335114585
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,1536,1024,0.012111999922328524
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,1536,512,0.0032142222755485107
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,1536,768,0.012069332930776807
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,1536,768,0.023424888650576275
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,1536,256,0.003156444471743372
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,1536,512,0.011735999749766456
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,1536,512,0.021651556094487507
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,1536,128,0.0028728888266616394
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,1536,6144,0.016176889340082806
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,1536,256,0.011765333513418833
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,1536,64,0.002830222249031067
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,1536,128,0.017864000466134813
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,1536,32,0.0025351111673646504
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,1536,4096,0.014466666513019137
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,1536,64,0.011700444751315646
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,1024,65536,0.031515555249320135
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,1536,32,0.010678222609890832
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,1024,51200,0.025722665919197932
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,1024,65536,0.07891111241446601
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,1024,65536,0.17827110820346406
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,1024,51200,0.06227999925613403
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,1024,16384,0.012737777498033313
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,1024,51200,0.144543104701572
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,1536,1536,0.012504888905419244
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,1024,12288,0.010325333310498131
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,1024,16384,0.05984622240066528
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,1024,10240,0.010474666953086853
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,1024,12288,0.02166755497455597
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,1024,12288,0.05056533217430115
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,1024,8192,0.009174221919642555
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,1024,10240,0.01976977785428365
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,1024,10240,0.045441776514053345
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,1024,7168,0.008980444735950893
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,1024,8192,0.017680888374646504
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,1536,256,0.01993955506218804
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,1024,8192,0.040538665321138166
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,1024,6144,0.007999111380841997
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,1024,7168,0.016540444559521146
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,1024,7168,0.037992888026767306
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,1536,128,0.011072888970375061
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,1024,5120,0.008385777473449707
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,1024,6144,0.03616355525122748
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,1024,6144,0.016014221641752455
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,1024,4096,0.007324444750944774
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,1024,3584,0.007086222370465596
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,1024,5120,0.03287555442916022
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,1024,5120,0.01513777838812934
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,1024,3072,0.006237333433495627
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,1024,4096,0.029823111163245306
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,1024,4096,0.014092443717850579
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,1024,2560,0.005886222339338726
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,1024,3584,0.014117333624098035
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,1024,3584,0.02917511264483134
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,1024,2048,0.0052639999323421055
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,1024,3072,0.028484443823496502
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,1024,3072,0.013760888742076026
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,1024,1536,0.004541333350870344
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,1024,2560,0.01311911145846049
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,1024,2048,0.02513955533504486
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,1024,2048,0.01275199982855055
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,1024,1536,0.01275466630856196
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,1024,1024,0.004004444513056013
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,1024,1536,0.024833778540293377
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,1024,768,0.003546666767862108
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,1024,16384,0.025574222207069397
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,1024,1024,0.012058667010731168
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,1024,1024,0.024693333440356787
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,1024,768,0.022341334157519873
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,1024,768,0.011815999945004782
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,1024,256,0.00315022220214208
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,1024,512,0.022656889425383672
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,1024,512,0.011710222396585675
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,1024,128,0.002817777709828483
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,1024,256,0.02056711084312863
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,1024,256,0.011341333389282227
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,1024,64,0.002504000026318762
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,1024,32,0.002642666714058982
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,1024,128,0.019723556107944913
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,1024,128,0.011031111081441244
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,768,65536,0.025822222232818604
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,1024,64,0.01072088877360026
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,768,51200,0.02124622298611535
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,1024,32,0.010679110884666443
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,768,65536,0.07572888665729098
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,768,16384,0.011344888971911537
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,768,51200,0.06042755312389798
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,768,65536,0.1781360043419732
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,768,51200,0.14338844352298313
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,768,12288,0.009938666390048133
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,768,16384,0.024977778395016987
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,768,16384,0.060121774673461914
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,768,10240,0.010102222363154093
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,768,12288,0.04964977833959791
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,768,12288,0.021095999413066443
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,768,8192,0.008784000244405534
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,768,10240,0.044886221488316856
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,768,10240,0.019259555472267997
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,768,7168,0.007994666695594788
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,768,8192,0.01750666730933719
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,768,8192,0.03940088881386651
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,768,6144,0.0076142218377855085
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,1024,512,0.0031759999692440033
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,768,7168,0.016399110356966656
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,768,7168,0.03765155540572272
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,768,6144,0.015501333607567681
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,768,6144,0.03597066799799601
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,768,4096,0.007576888634098901
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,768,5120,0.03254577848646376
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,768,5120,0.014813333749771118
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,768,3584,0.007156444092591603
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,768,4096,0.01443733274936676
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,768,4096,0.029834667841593426
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,768,3072,0.0069360000391801195
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,768,3584,0.029453333881166246
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,768,2560,0.006821333534187741
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,768,3072,0.013415111435784234
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,768,3072,0.029109332296583388
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,768,2048,0.0052168890833854675
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,768,2560,0.013078221844302284
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,768,2560,0.026499556170569524
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,768,1536,0.004512888689835866
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,768,2048,0.01277511070171992
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,768,2048,0.024728000164031982
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,768,1024,0.0039057777159743835
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,768,1536,0.01237422227859497
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,1024,2560,0.02847377790345086
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,768,768,0.003527111063400904
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,768,1024,0.012062222593360476
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,768,1024,0.02365422248840332
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,768,512,0.0034968890249729156
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,768,768,0.022597332795461018
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,768,768,0.012120889292822944
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,768,256,0.0030168888883458245
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,768,5120,0.008126222425036961
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,768,512,0.011381333072980246
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,768,512,0.021538666552967493
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,768,128,0.0028275555620590844
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,768,256,0.011738667057620155
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,768,128,0.018368000785509746
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,768,64,0.0026142222599850762
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,768,128,0.0110880004035102
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,768,32,0.002520888836847411
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,512,65536,0.019573332534896005
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,768,3584,0.013816888961527081
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,768,64,0.010495999621020423
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,768,32,0.01036000003417333
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,512,51200,0.01566844516330295
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,512,65536,0.07388266589906481
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,512,16384,0.011101333631409539
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,512,51200,0.05957066350513034
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,512,65536,0.17697244220309785
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,512,51200,0.14272711012098524
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,512,12288,0.009015111459626092
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,512,16384,0.024733333124054804
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,512,16384,0.05831466780768501
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,512,10240,0.009158222211731805
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,512,12288,0.04861688945028517
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,512,12288,0.020769778225156996
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,512,8192,0.008285333712895712
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,512,10240,0.018927110566033255
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,512,10240,0.04459822177886963
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,512,7168,0.007839110990365347
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,512,8192,0.017154667112562392
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,512,6144,0.007322666545708974
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,512,7168,0.01668711172209846
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,512,7168,0.037420445018344455
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,512,5120,0.007937777373525832
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,512,6144,0.01551999979548984
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,512,6144,0.03566755519972907
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,768,256,0.020012444920010038
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,512,4096,0.007344000041484833
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,512,5120,0.014793778459231058
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,512,5120,0.0325288905037774
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,512,3584,0.0069360000391801195
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,512,4096,0.03084533413251241
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,512,3072,0.006633777585294511
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,512,3584,0.02946044339074029
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,512,3584,0.013516444298956128
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,512,2560,0.006578666468461354
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,512,3072,0.028320001231299505
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,512,3072,0.013790222505728403
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,512,2048,0.006276444428496891
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,512,2560,0.013077333569526672
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,512,2560,0.026576000783178542
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,512,1536,0.004513777792453766
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,512,2048,0.013101333545313941
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,768,1536,0.025303999582926433
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,512,1024,0.003912888881233004
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,512,1536,0.012110222544935016
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,512,1536,0.026428444517983332
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,512,768,0.0035217776894569397
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,512,1024,0.012421333127551608
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,512,8192,0.04003466831313239
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,512,1024,0.02336888843112522
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,512,512,0.0031600000543726813
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,512,768,0.02366488840844896
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,512,256,0.0028648889727062653
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,512,512,0.022659555077552795
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,512,512,0.011411555939250521
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,512,128,0.0028088889602157804
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,512,256,0.021087111698256597
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,512,256,0.011726222104496427
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,512,64,0.0024871110088295406
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,512,128,0.01074488874938753
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,512,32,0.002507555608948072
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,512,4096,0.014103111293580798
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,256,65536,0.015093333191341825
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,512,64,0.011404444773991903
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,512,32,0.010077333284748925
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,256,51200,0.013751111096805997
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,256,65536,0.07204444540871514
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,256,65536,0.17713777224222818
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,256,16384,0.009656888743241629
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,256,51200,0.05795911285612318
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,512,2048,0.025401777691311304
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,256,51200,0.1430071062511868
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,256,16384,0.024350222614076402
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,256,16384,0.058132443163130015
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,256,10240,0.007655999726719326
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,256,12288,0.02058844433890449
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,256,12288,0.04863288998603821
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,256,8192,0.007304888632562425
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,512,768,0.0121760004096561
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,256,10240,0.04384533233112759
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,256,7168,0.006636444479227066
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,256,8192,0.017509332961506315
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,256,8192,0.04011111127005683
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,256,6144,0.006601777755551868
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,256,7168,0.016161777906947665
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,256,7168,0.03770844472779168
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,256,5120,0.006301333506902059
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,256,6144,0.0158906661801868
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,256,6144,0.034993777672449745
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,256,4096,0.006647999915811751
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,256,5120,0.015139554937680563
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,256,5120,0.03341333402527703
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,256,3584,0.0063368889192740125
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,256,4096,0.014104000396198697
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,256,4096,0.030823998981051978
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,256,3072,0.006295111030340195
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,256,3584,0.014156444205178155
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,256,3584,0.028841776980294123
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,256,12288,0.008336000144481659
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,256,3072,0.013802666631009845
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,256,3072,0.028736889362335205
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,256,2048,0.006317333214812809
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,256,2560,0.013076444466908773
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,256,2560,0.02751022246148851
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,256,1536,0.00424177779091729
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,256,10240,0.018906666172875296
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,256,2048,0.013073777986897362
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,256,2048,0.025071110990312364
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,256,1024,0.0038577777643998465
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,256,1536,0.01274577776590983
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,256,1536,0.024340444140964087
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,256,768,0.0034959999223550162
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,256,1024,0.011920000116030375
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,256,1024,0.024988444315062627
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,256,512,0.0031742221779293488
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,256,768,0.02336799932850732
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,256,768,0.011749332977665795
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,256,256,0.0028799999919202593
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,256,512,0.012076444096035428
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,256,128,0.0028408887899584244
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,256,256,0.011095999843544431
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,256,256,0.021651556094487507
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,256,64,0.002834666727317704
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,256,128,0.011743110915025076
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,256,128,0.01789777808719211
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,256,32,0.0026746667507621977
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,256,64,0.011543110840850405
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,256,32,0.01016355554262797
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,256,2560,0.006590222318967183
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,128,51200,0.013068444199032254
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,128,65536,0.07102133168114556
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,128,65536,0.17635733551449248
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,128,51200,0.05688266621695625
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,128,16384,0.007937777373525832
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,128,51200,0.14253777927822536
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,128,12288,0.007605333295133378
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,128,16384,0.058112886216905385
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,128,16384,0.0237128883600235
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,128,10240,0.007279111279381647
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,128,12288,0.020928000410397846
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,128,12288,0.04823377728462219
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,128,8192,0.007276444799370236
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,512,128,0.019274666905403137
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,128,10240,0.018889778190188937
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,128,10240,0.044469333357281156
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,256,512,0.02204622162712945
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,128,8192,0.039714667532179095
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,128,6144,0.006612444503439798
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,128,7168,0.03731733229425218
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,128,65536,0.014716444744004143
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,128,6144,0.015791111522250705
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,128,6144,0.034918222162458636
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,128,5120,0.005981333139869902
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,128,4096,0.005988444305128521
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,128,5120,0.03257511059443156
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,128,5120,0.015127110812399121
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,128,3584,0.006233777850866318
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,128,4096,0.014498665928840637
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,128,4096,0.029750221305423315
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,128,3072,0.00592533333433999
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,128,3584,0.029767112599478826
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,128,3584,0.014098667436175875
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,128,2560,0.006504888749784893
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,128,3072,0.013425778183672162
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,128,3072,0.028825776444541082
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,128,2048,0.005943999936183293
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,128,2560,0.013418667018413544
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,128,2560,0.026730666557947796
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,128,1536,0.0042444442709287005
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,128,2048,0.02643022272321913
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,128,2048,0.013097777962684631
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,128,7168,0.006823110911581252
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,128,1024,0.003866666720973121
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,128,1536,0.01237422227859497
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,128,8192,0.016876444220542908
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,128,1536,0.025360888904995386
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,128,768,0.0032097777972618737
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,128,1024,0.025053333905008104
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,128,512,0.003165333428316646
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,128,7168,0.016786666380034555
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,128,256,0.0028293333533737394
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,128,768,0.02367111047108968
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,128,768,0.011688888900809817
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,128,512,0.02183466653029124
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,128,128,0.00258933338854048
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,128,512,0.012088889049159156
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,128,64,0.002514666567246119
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,128,256,0.021028444170951843
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,128,32,0.002537777854336633
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,64,128,128,0.017504000001483493
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,128,128,0.010738666686746808
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,64,65536,0.011026666396194033
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,128,64,0.011753777662913004
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,64,51200,0.009665778113736046
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,128,32,0.011029333704047732
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,64,16384,0.007261333366235097
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,64,12288,0.006614222294754452
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,64,65536,0.07004088825649686
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,64,10240,0.006279110908508301
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,64,51200,0.05558933152092827
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,64,8192,0.0062871111763848206
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,64,16384,0.0239955551094479
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,64,12288,0.020597333709398907
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,64,6144,0.0062977779242727495
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,64,10240,0.018958222534921434
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,64,5120,0.005973333285914526
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,64,7168,0.016533333394262526
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,64,4096,0.005945777727497949
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,64,6144,0.015311999453438653
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,64,5120,0.01479555500878228
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,64,3584,0.005940444353553984
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,64,3072,0.005555555638339784
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,64,4096,0.014188443620999655
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,64,3584,0.01347555551264021
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,128,1024,0.012060444388124677
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,64,2560,0.00629333323902554
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,64,2048,0.005600888695981767
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,64,2560,0.013060444758998023
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,64,1536,0.0042364444169733255
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,128,256,0.011717333561844297
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,64,1024,0.003679111186001036
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,64,1536,0.012342222034931183
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,64,768,0.0032097777972618737
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,64,1024,0.012240889171759287
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,64,512,0.0031591111587153543
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,64,768,0.011772444678677453
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,64,256,0.002838222309947014
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,64,512,0.011728000309732227
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,64,128,0.002499555548032125
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,64,8192,0.01754044493039449
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,64,256,0.011317333413494958
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,64,64,0.0025235555238193935
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,64,128,0.011412444214026133
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,64,32,0.002663111107216941
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,32,65536,0.011056889262464313
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,64,64,0.0107004443804423
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,32,51200,0.009706666900051964
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,32,65536,0.06775910986794366
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,64,3072,0.013249778085284762
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,32,16384,0.007368000017272101
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,32,51200,0.05496355560090807
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,32,12288,0.006626666833957036
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,32,10240,0.006263999889294307
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,32,16384,0.02367199957370758
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,64,2048,0.012726222475369772
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,32,8192,0.006288888967699475
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,32,12288,0.020414221617910597
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,32,7168,0.006137777947717243
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,32,10240,0.01960088809331258
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,32,6144,0.005906666732496685
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,32,5120,0.005910222315125995
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,32,8192,0.01717066599263085
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,32,7168,0.016223111086421542
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,32,4096,0.005571555760171678
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,32,6144,0.015841777125994366
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,32,3584,0.006232888748248418
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,32,3072,0.005889777921968036
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,32,5120,0.014797333214018079
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,32,2560,0.005947555518812603
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,32,4096,0.014127999544143677
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,64,7168,0.006268444574541516
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,32,3584,0.014182221558358936
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,32,2048,0.005554666535721884
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,32,3072,0.013416888813177744
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,32,1536,0.004264889078007804
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,32,1024,0.0035546666218174826
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,32,2560,0.012794666820102267
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,32,768,0.0035031110876136353
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,32,512,0.0031475555151700974
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,32,2048,0.012719111310111152
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,32,1536,0.012392000191741519
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,32,256,0.00254133323000537
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,32,1024,0.012445333103338877
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,32,128,0.002532444480392668
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,32,768,0.011728888584507836
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,32,64,0.0025128889828920364
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,32,512,0.011401777466138205
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,32,256,0.011067555182509951
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,32,128,0.010693333215183683
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,32,64,0.010695999695195092
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,32,32,0.010276444256305695
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,65536,16384,0.17666133244832358
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,65536,12288,0.27218132548862034
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,65536,51200,0.5187528928120931
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,65536,12288,0.13372800085279676
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,65536,10240,0.2304640081193712
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,65536,10240,0.11453066931830512
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,65536,8192,0.1882364484998915
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,65536,8192,0.09812000062730576
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,65536,51200,1.1224337683783638
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,65536,7168,0.16257511244879827
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,64,32,32,0.0025031111306614345
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,64,64,32,0.011051555474599203
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,65536,6144,0.13805422517988417
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,65536,7168,0.08406044377221002
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,65536,3584,0.08472088972727458
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,65536,5120,0.06455466482374403
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,65536,4096,0.09611377451154922
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,65536,4096,0.0547964440451728
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,65536,3072,0.0730817781554328
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,65536,16384,0.36924089325798887
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,65536,6144,0.07460444503360324
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,65536,3072,0.04499288731151157
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,65536,2560,0.04091644287109375
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,65536,1536,0.039840890301598444
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,65536,2048,0.03561955690383911
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,65536,1024,0.0292195545302497
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,65536,768,0.02234577801492479
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,65536,1536,0.030829333596759375
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,65536,512,0.015300444430775113
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,65536,1024,0.024502222736676533
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,65536,256,0.009398221969604492
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,65536,768,0.020777778493033517
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,65536,512,0.017865777015686035
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,65536,128,0.006271111054552927
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,65536,256,0.015789333317014907
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,65536,64,0.007306666837798224
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,65536,128,0.014807111687130399
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,65536,64,0.014648000399271647
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,65536,32,0.007664889097213745
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,65536,32,0.01848266687658098
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,65536,3584,0.04987200101216634
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,65536,5120,0.11893599563174778
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,65536,2560,0.061900443500942655
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,65536,2048,0.05119911167356703
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,51200,16384,0.2755964332156711
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,51200,16384,0.14381689495510525
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,51200,65536,0.5459404521518284
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,51200,51200,0.4200391239590115
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,51200,12288,0.20775555239783394
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,51200,10240,0.1732391119003296
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,51200,12288,0.10994933048884074
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,51200,65536,1.0861066182454426
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,51200,10240,0.0942666663063897
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,51200,51200,0.8513075510660807
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,51200,8192,0.14013689094119602
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,51200,7168,0.12387111451890732
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,51200,6144,0.10677866803275214
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,51200,8192,0.08064622349209256
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,51200,5120,0.09067822164959377
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,51200,3584,0.06526044342252943
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,51200,4096,0.07387555307812162
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,51200,7168,0.07030844688415527
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,51200,3072,0.0573564436700609
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,51200,6144,0.06240799691942003
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,51200,5120,0.05450488792525398
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,51200,4096,0.04660711023542616
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,51200,3584,0.042783111333847046
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,51200,3072,0.038690666357676186
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,51200,1536,0.030797332525253296
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,51200,2048,0.03912711143493652
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,51200,2560,0.0481333335240682
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,51200,1024,0.023041778140597876
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,51200,768,0.016875555117925007
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,51200,2048,0.03137600090768602
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,51200,512,0.012231999801264869
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,51200,1536,0.02713866697417365
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,51200,256,0.008265777594513362
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,51200,128,0.0052533331844541765
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,51200,768,0.019024888674418133
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,51200,1024,0.020644444558355544
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,51200,256,0.014477334088749357
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,51200,32,0.004872000051869286
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,51200,128,0.013807999591032663
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,51200,64,0.014106666048367819
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,51200,32,0.017550221747822232
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,16384,65536,0.20839644802941215
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,16384,51200,0.15738756126827663
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,16384,51200,0.27172711160447865
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,16384,16384,0.08321422338485718
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,16384,12288,0.06450577576955159
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,16384,16384,0.06034488810433281
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,16384,10240,0.053267555104361645
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,16384,12288,0.047162665261162647
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,16384,8192,0.04518311222394308
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,16384,10240,0.041534221834606595
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,16384,7168,0.03882133298450046
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,51200,2560,0.03485066692034403
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,16384,8192,0.03670577870474921
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,16384,6144,0.034103999535242714
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,16384,7168,0.032708442873424955
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,16384,6144,0.03020533257060581
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,51200,512,0.016826666063732572
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,51200,64,0.004513777792453766
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,16384,4096,0.02591288917594486
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,16384,5120,0.027442667219373915
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,16384,3584,0.021820444199774
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,16384,3072,0.01906399925549825
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,16384,2560,0.016564443707466125
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,16384,4096,0.024167999625205994
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,16384,3584,0.022295110755496558
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,16384,3072,0.020563556088341605
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,16384,1536,0.011161777708265515
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,16384,1024,0.008623110751310984
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,16384,2560,0.019870221614837646
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,16384,2048,0.018194667167133756
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,16384,768,0.007245333658324347
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,16384,512,0.005599110904667113
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,16384,65536,0.35184444321526426
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,16384,768,0.013752889302041797
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,16384,256,0.004023111114899318
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,16384,1024,0.014489778214030795
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,16384,128,0.003506666670242945
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,16384,256,0.012092444631788464
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,16384,64,0.0032302221904198327
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,16384,32,0.003499555504984326
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,16384,128,0.011693333586057028
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,16384,64,0.011758222348160215
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,16384,32,0.012441777520709567
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,16384,5120,0.029394666353861492
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,12288,65536,0.27096888754102916
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,12288,51200,0.212208006117079
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,12288,65536,0.17944710784488252
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,12288,16384,0.07634044355816312
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,16384,2048,0.013564444250530668
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,12288,12288,0.05246666736072964
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,12288,51200,0.13891911506652832
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,12288,16384,0.0527688894006941
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,12288,10240,0.043656888935301036
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,12288,8192,0.037775112522972956
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,12288,12288,0.042265776130888194
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,12288,7168,0.03216088811556498
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,16384,1536,0.016947555873129103
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,12288,10240,0.0377075539694892
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,12288,6144,0.027793778313530818
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,12288,5120,0.02427911096149021
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,12288,8192,0.033244444264305964
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,12288,7168,0.029971556531058416
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,12288,4096,0.020336000455750358
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,12288,3584,0.017737777696715463
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,12288,6144,0.027405333187845018
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,16384,512,0.013088000317414602
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,12288,3072,0.015840889679061044
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,12288,5120,0.023718222975730896
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,12288,2560,0.013450666434235044
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,12288,4096,0.02154133386082119
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,12288,2048,0.011701333026091257
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,12288,1536,0.009683555199040307
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,12288,3072,0.01956266661485036
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,12288,3584,0.020855110552575853
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,12288,1024,0.008088000118732452
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,12288,2560,0.018516444497638278
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,12288,768,0.006648889018429651
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,12288,512,0.004534222185611725
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,12288,2048,0.017881777551439073
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,12288,256,0.0038488888078265717
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,12288,1536,0.016176000237464905
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,12288,128,0.00351555562681622
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,12288,1024,0.013762666947311826
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,12288,768,0.01329066687160068
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,12288,64,0.00327822214199437
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,12288,512,0.012759110993809171
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,12288,256,0.012123555772834353
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,12288,32,0.003567111161020067
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,12288,128,0.011428444749779172
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,12288,64,0.011691555380821228
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,12288,32,0.01239911135700014
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,10240,16384,0.06297689014010958
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,10240,51200,0.17356622219085693
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,10240,65536,0.22068444887797037
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,10240,12288,0.04204622242185804
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,10240,65536,0.16971377531687418
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,10240,51200,0.13249866167704263
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,10240,16384,0.05087822344568041
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,10240,10240,0.03511111272705926
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,10240,8192,0.03014933400683933
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,10240,7168,0.025791999366548326
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,10240,6144,0.022671999202834234
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,10240,12288,0.04077600108252631
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,10240,10240,0.0364951127105289
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,10240,8192,0.03236177894804213
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,10240,7168,0.029027554723951552
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,10240,4096,0.01644977761639489
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,10240,3584,0.014449778530332776
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,10240,3072,0.013087111214796701
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,10240,6144,0.026554667287402686
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,10240,3584,0.020083554916911654
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,10240,2560,0.01129155523247189
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,10240,2048,0.009685333404276106
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,10240,3072,0.01904355486234029
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,10240,1536,0.008270222279760573
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,10240,1024,0.0069004446268081665
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,10240,2048,0.017200888858901132
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,10240,768,0.0052044445441828836
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,10240,1536,0.015125332607163323
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,10240,512,0.004357333398527569
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,10240,1024,0.013460444079505073
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,10240,768,0.013460444079505073
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,10240,512,0.012440889245933957
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,10240,128,0.0032239999208185407
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,10240,256,0.012105777859687805
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,10240,64,0.0031511110977994073
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,10240,128,0.011374221907721626
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,10240,32,0.00350577798154619
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,10240,64,0.012070222033394707
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,10240,5120,0.019879110985332064
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,10240,32,0.012112889024946423
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,8192,65536,0.17885511451297334
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,10240,5120,0.023079110516442194
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,10240,4096,0.020920889245139226
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,8192,51200,0.14367466502719456
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,8192,16384,0.04951644606060452
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,8192,65536,0.12187377611796062
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,8192,12288,0.036610666248533465
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,8192,10240,0.030776888132095337
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,10240,2560,0.018176888426144917
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,8192,16384,0.0391866664091746
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,8192,51200,0.09457511372036403
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,8192,8192,0.02604444490538703
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,8192,12288,0.03161599900987413
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,8192,7168,0.02295200030008952
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,8192,5120,0.017498667041460674
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,8192,6144,0.01997244523631202
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,8192,10240,0.028547555208206177
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,8192,4096,0.01481066644191742
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,8192,6144,0.02095555596881443
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,10240,256,0.0035546666218174826
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,8192,3584,0.013033777475357056
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,8192,5120,0.019367999500698514
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,8192,3072,0.011854222251309289
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,8192,2560,0.010603555374675326
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,8192,4096,0.017851556340853374
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,8192,2048,0.0090506664580769
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,8192,3584,0.01763911048571269
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,8192,3072,0.01683644453684489
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,8192,1536,0.007655999726719326
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,8192,2560,0.01646311084429423
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,8192,1024,0.005958222266700532
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,8192,768,0.004555555681387584
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,8192,2048,0.0147706667582194
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,8192,1536,0.013791110780504016
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,8192,512,0.003858666867017746
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,8192,256,0.0035182221068276297
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,8192,1024,0.012489777472284106
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,8192,128,0.0031848889258172777
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,8192,512,0.012067555553383298
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,8192,256,0.011408000356621213
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,8192,64,0.0028684443483750024
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,8192,128,0.011366222467687396
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,8192,64,0.011367110742463006
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,8192,32,0.012087999946541257
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,7168,65536,0.16087199581993952
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,8192,8192,0.023945776952637568
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,7168,65536,0.11162400245666504
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,8192,7168,0.022329777479171753
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,7168,51200,0.12757333119710287
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,7168,16384,0.047016001409954496
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,7168,12288,0.034203555848863386
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,7168,10240,0.028816888729731243
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,7168,51200,0.08763111299938625
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,7168,16384,0.03717422154214647
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,7168,8192,0.02462133268515269
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,7168,12288,0.030029333300060693
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,7168,7168,0.02124799953566657
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,7168,6144,0.01869333287080129
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,7168,10240,0.02680711117055681
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,7168,8192,0.022967111733224656
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,7168,5120,0.016138666205936007
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,7168,7168,0.020961778031455144
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,7168,4096,0.013735111388895245
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,7168,3584,0.012353777885437012
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,7168,6144,0.02017155620786879
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,8192,768,0.01273155543539259
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,7168,3072,0.011129777464601727
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,7168,4096,0.017496888836224873
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,7168,3584,0.01717155509524875
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,8192,32,0.0032106666929192017
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,7168,2048,0.008839111361238692
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,7168,1536,0.007257777783605788
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,7168,2560,0.015440000428093804
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,7168,1024,0.0052488889131281115
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,7168,2048,0.013793778088357715
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,7168,768,0.004228444563017951
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,7168,1536,0.013428444663683573
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,7168,512,0.0038568890757030914
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,7168,768,0.012726222475369772
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,7168,256,0.0035422220826148987
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,7168,512,0.012059555285506778
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,7168,128,0.0031715554909573663
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,7168,256,0.011719110939237805
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,7168,64,0.003149333306484752
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,7168,128,0.011370666325092316
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,7168,32,0.003167111012670729
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,7168,64,0.0110880004035102
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,7168,32,0.011377777490350934
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,6144,65536,0.14090222782558864
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,7168,2560,0.010034666293197209
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,6144,65536,0.10463911294937134
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,6144,51200,0.1116480032602946
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,7168,3072,0.016561778055297006
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,6144,16384,0.03996888796488444
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,6144,12288,0.032616890139049955
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,6144,10240,0.028360890017615423
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,6144,51200,0.08137777778837416
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,6144,16384,0.03485688898298476
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,6144,12288,0.027913779020309448
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,6144,8192,0.025119110941886902
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,6144,7168,0.02223555578125848
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,6144,6144,0.01685599982738495
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,6144,10240,0.0239982224173016
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,6144,5120,0.015090665883488126
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,6144,8192,0.0229751103454166
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,6144,7168,0.02036266691154904
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,6144,4096,0.013248888982666863
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,6144,3584,0.011553777588738335
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,6144,6144,0.019553777244355943
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,6144,5120,0.018068444397714403
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,6144,3072,0.010688888529936472
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,6144,2560,0.009335999687512716
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,6144,4096,0.017058667209413316
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,6144,3584,0.01682400041156345
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,6144,2048,0.00757155567407608
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,6144,3072,0.015915556086434256
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,6144,1536,0.006322666588756774
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,6144,2560,0.01479822231663598
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,6144,2048,0.013464888764752282
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,6144,1536,0.013080000049538083
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,6144,768,0.0038951109680864546
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,6144,512,0.003552000141806073
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,6144,1024,0.012441777520709567
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,6144,256,0.003236444460021125
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,6144,768,0.012457778056462606
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,6144,128,0.002871111035346985
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,6144,512,0.012078222301271228
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,7168,5120,0.018797333041826885
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,6144,64,0.002809777855873108
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,6144,256,0.011722666521867117
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,6144,32,0.003154666680428717
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,6144,128,0.011117333339320289
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,6144,64,0.011739555332395764
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,6144,32,0.011756444142924415
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,5120,65536,0.11957332823011611
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,5120,16384,0.035707556539111666
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,5120,51200,0.09516888856887817
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,5120,65536,0.09656355778376262
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,7168,1024,0.01239466667175293
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,5120,51200,0.07523022095362346
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,5120,12288,0.028130667077170476
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,5120,10240,0.02436977790461646
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,5120,8192,0.020620443754725985
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,5120,12288,0.02631644407908122
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,5120,10240,0.02320266597800785
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,5120,7168,0.018932445181740653
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,5120,8192,0.021073778470357258
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,5120,6144,0.015855110353893705
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,5120,5120,0.014115555418862237
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,5120,7168,0.019510222805870902
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,5120,4096,0.01237066669596566
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,5120,3584,0.010772444307804108
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,5120,6144,0.018935999936527677
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,6144,1024,0.004580444345871608
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,5120,5120,0.017608889275126986
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,5120,2560,0.008623999853928884
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,5120,4096,0.01657777859105004
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,5120,2048,0.0069617778062820435
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,5120,3072,0.014783110883500842
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,5120,1536,0.0057795556883017225
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,5120,2560,0.014131555954615274
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,5120,2048,0.013112000293201871
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,5120,1024,0.004541333350870344
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,5120,768,0.004190222256713443
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,5120,1536,0.013063111239009433
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,5120,512,0.00360000009338061
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,5120,1024,0.012093333734406365
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,5120,256,0.003481777591837777
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,5120,768,0.01275022245115704
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,5120,128,0.003168888803985384
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,5120,512,0.012051555845472546
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,5120,64,0.0028799999919202593
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,5120,256,0.011633777783976661
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,5120,32,0.0031591111587153543
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,5120,128,0.011711999773979187
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,5120,64,0.011366222467687396
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,5120,16384,0.03229688935809665
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,5120,32,0.011699555648697747
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,4096,65536,0.09676266378826565
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,4096,16384,0.02840977907180786
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,4096,51200,0.07369510995017158
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,4096,65536,0.08928622139824761
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,4096,12288,0.02272622287273407
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,4096,51200,0.07133866680992974
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,5120,3072,0.009972444838947719
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,4096,10240,0.020018666982650757
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,4096,16384,0.029613332615958318
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,4096,12288,0.02369955513212416
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,4096,8192,0.01738577749994066
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,4096,7168,0.015809777710172866
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,5120,3584,0.015971556305885315
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,4096,10240,0.02164799968401591
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,4096,6144,0.012430222498046027
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,4096,5120,0.011301333705584208
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,4096,4096,0.00999111102686988
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,4096,8192,0.020247111717859905
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,4096,3584,0.008959111240175035
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,4096,7168,0.01885777711868286
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,4096,3072,0.008263111114501953
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,4096,6144,0.01795288920402527
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,4096,5120,0.017159110969967313
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,4096,4096,0.015460444821251763
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,4096,2048,0.006224000205596288
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,4096,3584,0.015083556373914083
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,4096,1536,0.004931555440028508
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,4096,3072,0.013551111022631327
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,4096,1024,0.004181333300140169
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,4096,2560,0.013762666947311826
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,4096,512,0.0035217776894569397
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,4096,2048,0.013086222112178802
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,4096,1536,0.013086222112178802
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,4096,256,0.003154666680428717
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,4096,768,0.012426666915416718
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,4096,128,0.0028195555011431375
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,4096,64,0.0028328889360030494
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,4096,512,0.012105777859687805
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,4096,256,0.011420444481902652
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,4096,32,0.002834666727317704
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,4096,128,0.01110666659143236
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,4096,64,0.011703111231327057
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,3584,65536,0.07915111382802327
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,4096,32,0.011197333534558615
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,3584,51200,0.0640044477250841
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,3584,65536,0.08650577730602688
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,3584,16384,0.026379555463790894
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,3584,12288,0.021232888102531433
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,3584,51200,0.06943111287222968
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,3584,10240,0.018410666121376883
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,3584,16384,0.028149333265092637
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,3584,12288,0.023008000519540574
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,3584,8192,0.01622222198380364
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,3584,7168,0.013743999931547375
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,3584,10240,0.021430222524536982
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,3584,6144,0.01202133297920227
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,4096,2560,0.00758844448460473
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,3584,8192,0.019946666227446664
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,3584,7168,0.01851466629240248
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,3584,6144,0.01751733322938283
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,4096,768,0.0037537775933742523
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,3584,4096,0.00997688869635264
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,3584,3584,0.008643555144468943
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,3584,5120,0.01703644461101956
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,3584,3072,0.00798044436507755
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,4096,1024,0.012098666694429187
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,3584,2048,0.0059075554211934405
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,3584,4096,0.01460800071557363
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,3584,3584,0.014490667316648694
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,3584,1536,0.004573333180612988
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,3584,3072,0.014112888111008538
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,3584,1024,0.0041955556306574075
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,3584,768,0.003850666599141227
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,3584,2048,0.012748444245921241
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,3584,512,0.003522666792074839
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,3584,1024,0.01256444470749961
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,3584,256,0.0031679999083280563
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,3584,768,0.012438221938080259
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,3584,128,0.003175111073586676
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,3584,512,0.012076444096035428
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,3584,64,0.0028088889602157804
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,3584,256,0.011781333221329583
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,3584,32,0.0028284444577164124
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,3584,128,0.011360888679822287
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,3584,64,0.011039111349317761
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,3072,65536,0.06999822457631429
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,3584,32,0.012072000238630505
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,3072,51200,0.05634578069051107
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,3072,16384,0.02251911163330078
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,3072,65536,0.08451377683215672
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,3584,5120,0.010662222074137794
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,3072,51200,0.06752177741792467
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,3072,12288,0.019485332899623446
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,3072,10240,0.016348444753222995
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,3072,16384,0.02717777755525377
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,3072,8192,0.01460622251033783
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,3072,7168,0.013416888813177744
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,3072,10240,0.020921778347757127
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,3584,2560,0.00720888872941335
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,3072,6144,0.012056888805495368
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,3072,5120,0.01034400032626258
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,3072,8192,0.019484443797005545
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,3072,4096,0.009300444689061906
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,3584,2560,0.013426666458447775
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,3072,6144,0.017308443784713745
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,3072,3584,0.008274666965007782
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,3072,3072,0.007576000359323289
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,3072,5120,0.016192888220151264
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,3584,1536,0.013071999781661563
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,3072,2560,0.006370666540331311
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,3072,2048,0.005790222022268508
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,3072,3072,0.013471110827393003
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,3072,2560,0.013460444079505073
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,3072,2048,0.012741333080662621
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,3072,1024,0.004193777839342753
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,3072,1536,0.01290844463639789
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,3072,768,0.003887999802827835
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,3072,1024,0.012107555237081317
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,3072,512,0.0035137778355015647
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,3072,768,0.012432888978057437
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,3072,256,0.0035013332962989807
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,3072,512,0.01203733351495531
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,3072,128,0.002979555477698644
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,3072,256,0.011748444702890186
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,3072,64,0.0028604444944196274
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,3072,12288,0.022631110416518316
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,3072,128,0.01108266661564509
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,3072,32,0.0031644445326593188
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,3072,64,0.011697777443461947
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,3072,7168,0.01819644371668498
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,3072,32,0.011029333704047732
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,2560,51200,0.04814044303364224
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,2560,16384,0.020455110404226515
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,2560,65536,0.08191555738449097
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,3072,3584,0.014101333088344999
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,2560,51200,0.0656764441066318
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,2560,12288,0.01723022262255351
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,2560,10240,0.014631999863518609
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,3072,1536,0.004882666799757215
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,2560,16384,0.026408000124825373
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,2560,8192,0.013430222041077085
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,2560,12288,0.022227555513381958
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,2560,7168,0.012483555409643384
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,2560,10240,0.0206995556751887
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,2560,6144,0.011696889168686338
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,2560,8192,0.01917866700225406
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,2560,5120,0.0107342220014996
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,2560,7168,0.01789155602455139
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,2560,6144,0.016789333687888253
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,2560,3584,0.007867555651399825
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,2560,5120,0.015848888291252982
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,2560,4096,0.014146667387750415
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,2560,3072,0.007310222420427535
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,2560,2560,0.006236444330877728
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,2560,3584,0.014129777749379476
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,2560,2048,0.0052720002002186244
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,2560,3072,0.013404444687896304
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,2560,1536,0.004572444491916233
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,2560,2560,0.013772444592581855
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,2560,1024,0.004211555752489301
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,2560,2048,0.013064888616402945
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,2560,768,0.0038355555799272326
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,2560,1536,0.01273333364062839
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,2560,65536,0.059976001580556236
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,2560,512,0.003564444267087512
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,2560,1024,0.012465777496496836
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,2560,256,0.0031804444475306403
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,2560,128,0.0031591111587153543
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,2560,768,0.012725333372751871
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,3072,4096,0.014447111222479077
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,2560,64,0.002974222310715251
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,2560,256,0.011905777785513135
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,2560,32,0.00281866660548581
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,2560,128,0.011350221931934357
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,2048,65536,0.05156977640257942
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,2560,64,0.011075555450386472
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,2048,51200,0.04078222314516703
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,2560,32,0.012057777908113269
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,2048,16384,0.0185244447655148
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,2048,65536,0.0786364475886027
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,2048,12288,0.015207999282413058
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,2048,51200,0.06379466586642794
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,2048,10240,0.013725333743625216
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,2048,16384,0.02583644456333584
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,2048,8192,0.013106666505336761
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,2048,12288,0.021990221407678392
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,2048,10240,0.02035466664367252
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,2048,6144,0.010690666735172272
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,2048,7168,0.017264000243610807
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,2048,5120,0.009931555224789513
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,2048,6144,0.015801777442296345
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,2048,4096,0.008866666919655269
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,2048,5120,0.015055111712879606
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,2048,3584,0.007595555649863348
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,2048,4096,0.014147554834683737
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,2048,3072,0.006785777707894643
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,2048,3584,0.014102222190962898
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,2560,512,0.012071111136012606
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,2048,2560,0.0058808889653947614
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,2048,2048,0.0052639999323421055
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,2048,3072,0.013417777915795645
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,2048,1536,0.004770666774776247
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,2048,2560,0.013432000246312885
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,2048,1024,0.0038773334688610504
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,2048,1536,0.012744888663291931
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,2048,768,0.0038524443904558816
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,2048,1024,0.012096000214417776
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,2560,4096,0.009032888544930352
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,2048,512,0.003195555466744635
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,2048,256,0.003157333367400699
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,2048,768,0.012400888734393649
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,2048,128,0.002867555452717675
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,2048,8192,0.0188773340649075
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,2048,64,0.0028515555378463534
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,2048,128,0.011369778050316704
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,2048,32,0.0028168888141711554
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,2048,64,0.011275555524561139
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,1536,65536,0.039734221167034574
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,2048,32,0.011063999599880643
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,1536,51200,0.03188622328970168
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,1536,65536,0.07636711332533094
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,1536,16384,0.01529600057337019
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,1536,12288,0.01330488920211792
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,1536,16384,0.025444444682863023
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,1536,10240,0.012060444388124677
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,2048,2048,0.012732444538010491
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,1536,12288,0.0218551109234492
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,1536,8192,0.010755555497275459
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,1536,7168,0.010417777631017896
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,1536,10240,0.019932443896929424
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,1536,8192,0.0173973325226042
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,1536,6144,0.00965244405799442
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,1536,5120,0.008904000123341879
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,1536,7168,0.016549333930015564
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,2048,7168,0.011352000137170156
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,1536,4096,0.008447111480765873
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,1536,3584,0.007652444144090016
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,1536,6144,0.01588800052801768
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,1536,5120,0.015141333142916361
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,2048,256,0.011408888631396823
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,1536,3072,0.006264888991912206
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,1536,4096,0.014101333088344999
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,1536,2560,0.005917333480384614
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,1536,3584,0.014051554931534661
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,1536,2048,0.0052800000541739995
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,1536,1536,0.004551110996140374
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,1536,3072,0.013435555828942193
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,1536,1024,0.0038808890514903595
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,1536,2560,0.013438222308953604
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,1536,768,0.0038382220599386427
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,1536,2048,0.01276177747382058
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,1536,512,0.0031973332580592898
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,1536,1024,0.012098666694429187
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,1536,256,0.0028684443483750024
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,1536,768,0.012443555725945367
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,1536,128,0.0028568889117903183
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,1536,512,0.011772444678677453
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,1536,64,0.0028239999794297745
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,1536,51200,0.061624891228146024
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,1536,256,0.011409777734014722
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,1536,128,0.011553777588738335
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,1536,64,0.011023110813564725
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,1024,65536,0.029382222228580054
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,1024,51200,0.024975111087163288
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,1536,32,0.011053333679835001
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,1024,16384,0.012716444830099741
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,1024,65536,0.07302133242289226
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,1024,12288,0.010334221853150262
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,1024,51200,0.05743288993835449
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,1024,16384,0.02437155610985226
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,1024,10240,0.010682666467295753
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,2048,512,0.012073777616024017
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,1024,12288,0.020595555504163105
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,1024,10240,0.018573333819707234
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,1024,8192,0.016827555166350473
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,1024,6144,0.01034311122364468
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,1024,7168,0.016182222300105624
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,1024,5120,0.009112888740168678
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,1536,1536,0.013088888592190213
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,1024,6144,0.015470221638679504
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,1024,4096,0.007611555357774098
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,1024,3584,0.006960888703664144
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,1024,5120,0.01477866702609592
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,1024,3072,0.00639111093348927
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,1024,4096,0.014125333891974555
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,1024,2560,0.00591466658645206
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,1024,3584,0.014427555931939019
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,1536,32,0.0028311111446883944
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,1024,2048,0.0052391112678580815
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,1024,3072,0.013390222357379066
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,1024,1536,0.0045422220395671
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,1024,2560,0.013085333009560903
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,1024,1024,0.0038888889054457345
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,1024,2048,0.012746666868527731
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,1024,1536,0.012698666916953193
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,1024,512,0.003481777591837777
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,1024,1024,0.011771555576059552
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,1024,768,0.012284444438086616
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,1024,256,0.0031439999325407874
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,1024,128,0.0028568889117903183
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,1024,512,0.011758222348160215
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,1024,64,0.0028124445428450904
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,1024,8192,0.009648000200589498
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,1024,256,0.01143555591503779
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,1024,32,0.0028373334142896864
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,1024,128,0.011072888970375061
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,1024,7168,0.00868000007337994
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,1024,64,0.01071999967098236
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,768,51200,0.021140444609853957
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,1024,32,0.010737777584128909
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,768,16384,0.011011555790901184
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,768,12288,0.009696889254781935
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,768,65536,0.07016266716851129
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,768,10240,0.010336000058386061
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,768,16384,0.023708444502618577
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,768,8192,0.008911111288600499
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,768,10240,0.018251554833518136
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,768,7168,0.007979555262459649
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,768,8192,0.016916443904240925
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,768,6144,0.007622222105662028
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,768,7168,0.01615111033121745
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,768,5120,0.008052444292439355
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,768,6144,0.0155102229780621
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,1024,768,0.0035422220826148987
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,768,4096,0.007598222129874759
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,768,3584,0.0069751110341813825
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,768,5120,0.014767999450365702
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,768,3072,0.006299555715587404
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,768,3584,0.013803555733627744
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,768,2560,0.0058853332367208265
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,768,3072,0.013424889081054263
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,768,2048,0.0052151112920708126
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,768,65536,0.0255039996571011
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,768,2560,0.01311822235584259
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,768,1536,0.004534222185611725
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,768,1024,0.003863111138343811
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,768,2048,0.01274311128589842
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,768,768,0.003546666767862108
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,768,1536,0.012442666623327466
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,768,51200,0.056074665652381055
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,768,1024,0.012084444363911947
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,768,512,0.0034506666577524612
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,768,256,0.003195555466744635
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,768,768,0.012120000190205045
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,768,128,0.0028311111446883944
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,768,512,0.01205244412024816
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,768,64,0.0028408887899584244
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,768,256,0.011397333608733283
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,768,32,0.0028204443968004654
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,768,128,0.011046222514576383
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,512,65536,0.0188755558596717
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,768,64,0.011377777490350934
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,512,51200,0.015463999576038785
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,768,32,0.011173333558771344
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,512,16384,0.010584000084135266
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,512,12288,0.008984000318580205
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,512,65536,0.06799733638763428
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,512,51200,0.05531822310553657
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,512,16384,0.023364444573720295
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,512,10240,0.009327111144860586
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,512,8192,0.008271111382378472
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,768,4096,0.014466666513019137
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,512,12288,0.019606222709019978
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,512,7168,0.009349333743254343
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,512,6144,0.008638222184446123
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,512,10240,0.01852888862291972
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,512,5120,0.008620444271299574
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,512,8192,0.016882666283183627
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,512,4096,0.007611555357774098
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,512,7168,0.016520000166363187
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,512,3584,0.006934222247865465
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,512,3072,0.006237333433495627
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,512,5120,0.01478666729397244
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,512,4096,0.013819555441538492
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,512,2560,0.005557333429654439
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,512,3584,0.014450665977266101
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,512,2048,0.004866666677925321
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,512,1536,0.004528000122971005
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,512,2560,0.01313866674900055
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,512,1024,0.0038497779104444715
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,512,2048,0.013108444710572561
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,512,1536,0.01276533305644989
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,768,12288,0.01995733380317688
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,512,768,0.003528000166018804
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,512,512,0.0034942221310403612
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,512,256,0.00319377767542998
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,512,1024,0.0120666664507654
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,512,128,0.0025191110455327565
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,512,768,0.01239377756913503
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,512,512,0.011703111231327057
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,512,64,0.0028195555011431375
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,512,32,0.002543111021320025
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,512,256,0.01145866678820716
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,512,128,0.011054221954610614
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,512,64,0.010685332947307162
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,512,32,0.011403555671374003
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,256,65536,0.06669333246019152
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,256,16384,0.009927999642160203
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,256,51200,0.054752889606687755
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,256,12288,0.009664889011118147
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,256,16384,0.023095111052195232
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,512,6144,0.015164444843928019
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,256,10240,0.008804444637563493
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,256,12288,0.019738665885395475
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,256,8192,0.008295999632941352
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,256,7168,0.008967111508051554
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,256,6144,0.008283555507659912
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,256,10240,0.018220444520314533
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,512,3072,0.013092444174819522
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,256,5120,0.007958222594526079
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,256,8192,0.016826666063732572
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,256,4096,0.0076044441925154785
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,256,7168,0.016520889268981088
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,256,3584,0.006625777731339137
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,256,6144,0.015470221638679504
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,256,3072,0.006224000205596288
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,256,5120,0.014449778530332776
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,256,2560,0.006031111296680238
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,256,4096,0.014123555686738757
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,256,3584,0.014149333039919535
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,256,1536,0.004545777622196409
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,256,2560,0.01311911145846049
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,256,1024,0.0038480001191298165
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,256,1536,0.01276177747382058
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,256,768,0.0035217776894569397
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,256,1024,0.011782222323947482
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,256,51200,0.01514400045077006
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,256,512,0.0032186667538351486
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,256,256,0.0028239999794297745
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,256,768,0.01239377756913503
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,256,128,0.002817777709828483
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,256,256,0.011016888750924004
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,256,64,0.002708444371819496
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,256,128,0.011694221860832639
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,256,32,0.002579555536309878
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,256,64,0.0107342220014996
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,128,65536,0.014813333749771118
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,256,32,0.011390222443474663
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,128,65536,0.06480889187918769
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,256,2048,0.004911111046870549
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,256,3072,0.013145777914259167
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,128,16384,0.009356444080670675
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,256,2048,0.012772444221708508
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,128,51200,0.05150666501786974
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,128,12288,0.009338666995366415
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,256,65536,0.015800888339678448
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,128,10240,0.008795555267069075
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,128,8192,0.007984889050324758
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,128,16384,0.022980444961124
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,128,7168,0.007320889168315464
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,128,12288,0.019313777486483257
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,128,6144,0.007310222420427535
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,128,10240,0.018579555882347953
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,128,5120,0.008000888758235509
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,128,8192,0.016879111528396606
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,128,4096,0.007400888535711501
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,256,512,0.011728000309732227
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,128,7168,0.015912888778580558
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,128,3584,0.006962666908899943
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,128,6144,0.015223999818166098
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,128,3072,0.006270222365856171
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,128,5120,0.015083556373914083
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,128,2560,0.006220444622966979
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,128,4096,0.014143110977278816
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,128,3584,0.013773333695199756
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,128,1536,0.004516444272465176
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,128,3072,0.01310755560795466
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,128,1024,0.0038888889054457345
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,128,768,0.0035084444615576
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,128,1536,0.012444444828563266
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,128,1024,0.012040889097584618
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,128,512,0.0031537777847713898
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,128,768,0.012372444073359171
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,128,512,0.011752888560295105
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,128,128,0.002532444480392668
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,128,51200,0.014101333088344999
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,128,256,0.011717333561844297
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,128,64,0.0028320000403457214
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,128,32,0.002814222127199173
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,128,128,0.010676444404655032
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,128,64,0.011412444214026133
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,64,65536,0.016171556380059984
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,128,32,0.010348444183667501
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,64,51200,0.01516533394654592
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,64,16384,0.008610666626029545
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,64,65536,0.0624835557407803
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,64,12288,0.00815822184085846
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,64,51200,0.05102133419778612
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,64,16384,0.02276444435119629
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,64,10240,0.007596444752481248
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,64,8192,0.006591111007663939
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,64,12288,0.019687111179033916
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,64,10240,0.01791200041770935
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,64,7168,0.006577777779764599
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,128,2048,0.0059368887709246735
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,64,6144,0.006240889016124938
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,64,5120,0.006909333169460297
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,128,2560,0.01311377767059538
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,128,2048,0.012687111066447364
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,64,4096,0.006280888699822956
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,64,7168,0.01579466627703773
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,64,3584,0.005965333431959152
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,64,6144,0.015608888533380298
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,64,3072,0.00591111100382275
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,64,2560,0.005951111101441913
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,128,256,0.002830222249031067
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,64,4096,0.013776000175211163
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,64,3584,0.013751111096805997
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,64,2048,0.005893333504597346
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,64,1536,0.004503111044565837
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,64,3072,0.013809777796268463
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,64,1024,0.003830222205983268
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,64,2560,0.013080000049538083
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,64,768,0.0032115555885765287
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,64,2048,0.012736000120639801
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,64,512,0.0028595555987623003
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,64,1536,0.012453333371215396
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,64,256,0.0028684443483750024
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,64,1024,0.01239466667175293
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,64,128,0.00281866660548581
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,64,64,0.002518222149875429
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,64,512,0.011772444678677453
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,64,256,0.011072888970375061
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,64,32,0.002471999989615546
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,64,128,0.011405333048767514
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,32,65536,0.015909334023793537
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,64,64,0.010327111515733931
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,32,51200,0.01482399966981676
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,32,16384,0.00868800034125646
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,64,32,0.0107360002067354
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,32,12288,0.007992888490358988
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,32,65536,0.06257688999176025
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,32,51200,0.0510044429037306
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,32,10240,0.007661333514584436
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,32,8192,0.006974221931563483
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,32,16384,0.022868444522221882
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,32,7168,0.006594666590293248
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,32,12288,0.019559999306996662
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,32,10240,0.01789422167672051
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,64,8192,0.016487111647923786
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,32,6144,0.006274666637182236
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,32,8192,0.017129777206314933
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,32,5120,0.006253333141406377
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,32,7168,0.015814221567577787
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,32,4096,0.005952000204059813
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,32,3584,0.005949333310127258
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,32,6144,0.015145777000321282
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,32,5120,0.0151591118839052
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,32,3072,0.005595555735958948
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,64,5120,0.01478666729397244
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,32,4096,0.013937777943081327
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,32,2560,0.00590133335855272
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,32,2048,0.005722666780153911
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,32,3584,0.013770666387346057
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,32,1536,0.0041991112132867174
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,32,3072,0.013782222237851886
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,32,1024,0.0038524443904558816
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,32,2560,0.013444444371594323
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,32,768,0.00351200004418691
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,32,512,0.00314666661951277
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,32,1536,0.012411555482281579
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,32,256,0.00282222218811512
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,64,768,0.01205599970287747
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,32,128,0.002826666666401757
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,32,512,0.011756444142924415
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,32,64,0.0024968888610601425
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,32,256,0.01070755554570092
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,49,32,32,0.002500444443689452
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,32,128,0.010696888797812991
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,32,64,0.01038755559258991
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,32,32,0.010339555641015371
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,65536,51200,0.5168968836466471
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,32,2048,0.012416889270146688
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,65536,16384,0.36394309997558594
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,32,1024,0.01240533341964086
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,49,32,768,0.012392000191741519
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,65536,16384,0.17688711484273276
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,65536,51200,1.1241209242078993
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,65536,12288,0.27232087983025444
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,65536,12288,0.1340142223570082
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,65536,10240,0.23124088181389701
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,65536,8192,0.18442400296529135
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,65536,10240,0.11437866422865127
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,65536,8192,0.09724799791971843
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,65536,7168,0.16178399986690944
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,65536,7168,0.0838773316807217
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,65536,6144,0.14066489537556967
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,65536,6144,0.07438933187060885
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,65536,12288,0.22108177344004312
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,65536,10240,0.18447021643320718
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,65536,8192,0.15436444017622206
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,65536,5120,0.11870133876800537
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,65536,7168,0.13864178127712673
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,65536,16384,0.28481777509053546
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,65536,5120,0.06454133325152926
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,65536,4096,0.0951555569966634
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,65536,3584,0.08356266551547581
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,65536,4096,0.05533866749869453
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,65536,3072,0.07338577508926392
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,65536,3584,0.05045066608322991
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,65536,6144,0.12332267231411403
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,65536,5120,0.10843555794821845
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,65536,3072,0.045147554741965405
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,65536,2560,0.061738669872283936
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,65536,4096,0.093758225440979
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,65536,2048,0.0512586666478051
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,65536,3584,0.0858151117960612
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,65536,2560,0.04067555401060317
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,65536,1536,0.04002044598261515
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,65536,3072,0.07793600029415555
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,65536,1024,0.02830577890078227
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,65536,2560,0.09156533082326253
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,65536,1536,0.030213332838482324
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,65536,768,0.021977777282396953
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,65536,2048,0.06657777892218696
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,65536,1536,0.05686577823426989
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,65536,1024,0.02332177758216858
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,65536,1024,0.0494026674164666
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,65536,512,0.015444444285498725
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,65536,768,0.020491555333137512
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,65536,768,0.04297599858707852
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,65536,256,0.00941244430012173
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,65536,128,0.007656888829337225
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,65536,512,0.03753066725201077
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,65536,512,0.017837334010336135
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,65536,64,0.0068915556702348925
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,65536,256,0.01593777702914344
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,65536,32,0.006635555376609166
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,65536,128,0.027115555273161993
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,65536,128,0.014817777607176038
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,65536,64,0.016144000821643405
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,65536,32,0.01924888955222236
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,65536,2048,0.0355751117070516
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,51200,65536,0.5502710872226292
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,51200,51200,0.8585199779934354
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,51200,65536,1.0663440492418077
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,51200,51200,0.41933510038587785
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,65536,256,0.03189244535234239
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,51200,16384,0.28252800305684406
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,51200,16384,0.14398933781517878
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,51200,12288,0.10995733075671726
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,51200,12288,0.21270667182074654
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,51200,10240,0.17162933614518908
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,65536,51200,0.9005155563354492
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,51200,10240,0.0945697757932875
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,51200,8192,0.1421413289176093
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,51200,8192,0.08054755793677436
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,51200,7168,0.12548532750871447
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,51200,16384,0.23878399531046549
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,51200,7168,0.07005955775578816
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,51200,12288,0.18644444147745767
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,51200,6144,0.10879466931025188
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,51200,10240,0.15935644838545057
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,51200,6144,0.06252444452709623
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,51200,5120,0.08985510799619888
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,51200,8192,0.13443377282884386
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,51200,4096,0.07384800248675875
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,51200,7168,0.12156711684332953
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,51200,5120,0.0542773339483473
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,51200,3584,0.06458044714397855
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,51200,4096,0.046203556987974376
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,51200,6144,0.10893688599268596
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,51200,3584,0.042691555288102895
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,51200,5120,0.09483822186787923
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,51200,3072,0.05759555763668484
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,51200,2560,0.04849866694874234
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,51200,4096,0.08277866575453016
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,51200,3072,0.03826133410135905
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,51200,2048,0.039905776580174766
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,51200,3584,0.07583822144402398
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,51200,3072,0.07015999820497301
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,51200,2560,0.06493422057893541
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,51200,1536,0.030949334303538006
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,51200,2048,0.056927998860677086
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,51200,1024,0.02293866707219018
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,51200,1536,0.026479111777411565
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,51200,1536,0.05066133207745022
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,51200,768,0.016791999340057373
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,51200,1024,0.02047911120785607
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,51200,1024,0.04350489046838549
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,51200,512,0.012068444656001197
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,51200,768,0.018600889378123812
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,51200,512,0.01662577854262458
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,51200,256,0.007963555554548899
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,51200,512,0.034635557068718806
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,51200,256,0.014289778139856128
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,51200,256,0.030636443032158747
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,51200,128,0.004876444323195351
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,51200,128,0.024791111548741657
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,51200,2048,0.030941334035661485
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,51200,128,0.013473778135246701
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,51200,64,0.0038817777401871155
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,51200,32,0.004319111092223061
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,51200,51200,0.7226737870110406
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,51200,64,0.014492443866199918
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,51200,32,0.01690933273898231
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,16384,65536,0.34931288825141055
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,16384,65536,0.2054177787568834
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,16384,51200,0.27379200193617076
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,16384,51200,0.15630843904283312
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,16384,16384,0.08316355281405978
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,51200,65536,0.9581866794162326
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,16384,12288,0.0646159980032179
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,16384,16384,0.06010933054818047
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,16384,10240,0.05353866683112251
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,16384,12288,0.049716442823410034
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,51200,2560,0.03482310970624288
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,16384,16384,0.07460977633794148
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,16384,8192,0.04500622219509549
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,16384,12288,0.06167111131880018
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,16384,7168,0.03854488995340135
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,16384,8192,0.03660533494419522
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,16384,10240,0.05669422282112969
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,16384,7168,0.03266311022970412
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,16384,8192,0.051939556996027626
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,16384,6144,0.03352355625894334
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,16384,5120,0.02904355525970459
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,16384,7168,0.04709600077735054
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,51200,768,0.03839733203252157
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,16384,6144,0.030322667625215318
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,16384,4096,0.025039111574490864
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,16384,6144,0.04381155636575487
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,16384,5120,0.027796443965699937
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,16384,3584,0.02151022189193302
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,16384,4096,0.024280889166726008
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,16384,5120,0.04044444362322489
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,16384,4096,0.03772088885307312
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,16384,3584,0.022034666604465906
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,16384,3072,0.01904711127281189
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,16384,3584,0.03559822175237868
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,16384,2560,0.016156444946924847
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,16384,65536,0.22407200601365831
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,16384,2048,0.013307555682129331
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,16384,3072,0.020958221620983545
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,16384,3072,0.03319999906751845
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,16384,1536,0.010797333386209277
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,16384,2560,0.03306044472588433
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,16384,2048,0.03141333328353034
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,16384,10240,0.040935112370385066
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,16384,1024,0.008827555510732863
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,16384,2560,0.01923111081123352
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,16384,1536,0.016527111331621807
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,16384,1536,0.029161777761247423
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,16384,768,0.007257777783605788
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,16384,512,0.005214222189452913
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,16384,1024,0.02789688772625393
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,16384,1024,0.014712888333532544
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,16384,256,0.0038328886859946777
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,16384,768,0.024864888853496973
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,16384,512,0.01274222218328052
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,16384,128,0.003212444484233856
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,16384,256,0.019888889458444383
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,16384,256,0.012031111452314587
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,16384,64,0.0031999999450312722
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,16384,128,0.012411555482281579
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,16384,128,0.018346667289733887
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,16384,32,0.003220444545149803
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,16384,64,0.011790222591824003
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,16384,32,0.012841777669058906
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,12288,65536,0.2590542104509142
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,12288,65536,0.17756088574727377
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,16384,51200,0.17603554990556505
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,12288,51200,0.20437333318922254
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,16384,2048,0.01833599971400367
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,12288,51200,0.13754488362206355
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,12288,16384,0.07420977618959215
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,16384,768,0.013080000049538083
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,12288,16384,0.052770667605929904
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,12288,12288,0.053210665782292686
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,16384,512,0.022639999787012737
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,12288,10240,0.04349155558480156
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,12288,12288,0.042113777663972646
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,12288,10240,0.03761333227157593
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,12288,16384,0.06583378050062391
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,12288,8192,0.03669155637423197
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,12288,12288,0.05500444438722399
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,12288,8192,0.03351199958059523
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,12288,7168,0.03014577759636773
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,12288,8192,0.045963555574417114
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,12288,6144,0.027961777316199407
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,12288,51200,0.15026666058434382
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,12288,7168,0.04312977857059903
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,12288,65536,0.18886221779717338
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,12288,6144,0.026944888962639704
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,12288,5120,0.024126221736272175
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,12288,4096,0.02033955521053738
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,12288,6144,0.03923022084765964
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,12288,3584,0.01794577803876665
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,12288,5120,0.02426133387618595
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,12288,5120,0.036999109718534685
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,12288,4096,0.02216800053914388
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,12288,3072,0.015957333975368075
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,12288,4096,0.03507555524508158
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,12288,3584,0.020576889316240948
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,12288,3584,0.03362755642996894
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,12288,2560,0.013966222604115805
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,12288,2048,0.012085333466529846
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,12288,3072,0.031574222776624895
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,12288,3072,0.019360888335439894
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,12288,2560,0.03226844469706217
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,12288,2560,0.018357333209779527
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,12288,1536,0.009964444571071202
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,12288,2048,0.02975289026896159
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,12288,2048,0.01717066599263085
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,12288,1536,0.028655999236636694
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,12288,1536,0.016393777396943834
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,12288,768,0.006573333508438534
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,12288,1024,0.013800889253616333
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,12288,7168,0.03206311000718011
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,12288,1024,0.024842666255103216
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,12288,512,0.005320000151793162
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,12288,768,0.013087111214796701
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,12288,768,0.02334755493534936
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,12288,256,0.004193777839342753
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,12288,10240,0.0507297780778673
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,12288,128,0.003760888758632872
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,12288,512,0.021945777866575453
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,12288,512,0.012105777859687805
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,12288,64,0.0032195556494924757
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,12288,256,0.020419556233617995
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,12288,32,0.0033280000918441345
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,12288,256,0.012124444047609964
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,12288,128,0.018198221921920776
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,12288,128,0.012087999946541257
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,12288,64,0.011724444727102915
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,12288,32,0.012400888734393649
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,10240,65536,0.2187031110127767
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,10240,51200,0.1720186604393853
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,10240,16384,0.06236622068617079
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,10240,51200,0.13163288434346518
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,10240,12288,0.04291911257637871
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,10240,16384,0.05131999982727898
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,10240,12288,0.040720889965693154
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,12288,1024,0.008045333127180735
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,10240,16384,0.06249688731299507
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,10240,10240,0.035306665632459856
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,10240,8192,0.029872000217437744
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,10240,12288,0.0532968905236986
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,10240,10240,0.036201778385374285
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,10240,8192,0.032279110617107816
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,10240,10240,0.04889688889185587
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,10240,7168,0.026151999831199646
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,10240,51200,0.14326488971710205
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,10240,8192,0.044180442889531456
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,10240,6144,0.022721777359644573
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,10240,65536,0.17705599466959634
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,10240,7168,0.0417520006497701
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,10240,5120,0.020132443971104093
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,10240,6144,0.02650755478276147
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,10240,6144,0.038438220818837486
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,10240,4096,0.01735822194152408
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,10240,65536,0.16608266035715738
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,10240,5120,0.023303111394246418
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,10240,5120,0.036496887604395546
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,10240,3584,0.014677332507239448
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,10240,4096,0.0214355554845598
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,10240,3072,0.013077333569526672
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,10240,4096,0.03375644485155741
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,10240,3584,0.020033778415785897
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,10240,3584,0.032495998673968844
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,10240,3072,0.0326186650329166
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,10240,2048,0.011349333657158745
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,10240,2560,0.017883555756674874
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,10240,2560,0.031222220924165513
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,10240,1536,0.009578666753239101
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,10240,2048,0.017419555120997958
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,10240,2048,0.029431111282772485
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,10240,1024,0.007609777980380588
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,10240,1536,0.015267555912335714
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,10240,1536,0.02863022353914049
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,10240,768,0.006607111129495833
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,10240,1024,0.01370666672786077
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,10240,1024,0.02403555479314592
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,10240,512,0.004886222382386525
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,10240,768,0.013092444174819522
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,10240,768,0.02331111166212294
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,10240,7168,0.028374221589830186
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,10240,256,0.0041893331540955436
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,10240,512,0.012404444317022959
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,10240,512,0.02233155568440755
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,10240,128,0.0035048888789282907
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,10240,256,0.011725333001878528
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,10240,64,0.0031591111587153543
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,10240,128,0.018221333622932434
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,10240,128,0.012064889073371887
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,10240,32,0.0035031110876136353
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,10240,64,0.011723555624485016
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,10240,2560,0.01276000009642707
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,10240,32,0.013119999733236102
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,10240,3072,0.01888088881969452
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,8192,65536,0.17909244696299234
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,8192,51200,0.1406008932325575
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,8192,65536,0.11871643861134847
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,8192,51200,0.09381333324644302
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,8192,16384,0.04951644606060452
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,8192,12288,0.03735555542839898
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,8192,16384,0.039353777964909874
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,8192,16384,0.06131466892030504
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,8192,12288,0.03221155537499322
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,8192,10240,0.03085955646302965
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,8192,12288,0.051869332790374756
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,8192,8192,0.02626666592227088
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,8192,10240,0.028934223784340754
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,8192,51200,0.1400631136364407
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,10240,256,0.019575999842749704
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,8192,10240,0.04833777745564779
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,8192,7168,0.02311022248533037
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,8192,8192,0.025358221597141687
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,8192,6144,0.02015555567211575
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,8192,65536,0.1721928914388021
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,8192,8192,0.044181333647833936
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,8192,7168,0.02325155503220028
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,8192,5120,0.017535999417304993
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,8192,7168,0.04141155547565884
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,8192,6144,0.021331555313534204
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,8192,4096,0.014967999524540372
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,8192,6144,0.038155555725097656
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,8192,3584,0.013108444710572561
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,8192,5120,0.019693333241674636
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,8192,5120,0.03628799981541104
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,8192,3072,0.011918221910794577
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,8192,4096,0.034338666333092585
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,8192,4096,0.018024888303544786
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,8192,2560,0.010379555324713389
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,8192,3584,0.01752355529202355
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,8192,3584,0.03239288926124573
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,8192,2048,0.008943110704421997
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,8192,3072,0.030806223551432293
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,8192,3072,0.016905777984195285
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,8192,2560,0.016005333926942613
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,8192,2048,0.0292577776643965
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,8192,2048,0.015096000499195524
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,8192,1024,0.005994666781690385
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,8192,1536,0.027123555541038513
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,8192,1536,0.013807999591032663
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,8192,768,0.0047626665068997275
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,8192,512,0.004004444513056013
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,8192,1024,0.023971555961502924
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,8192,1024,0.01272266689274046
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,8192,768,0.022983999715911016
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,8192,768,0.012471111284361945
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,8192,256,0.0035786665976047516
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,8192,512,0.012049777640236748
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,8192,512,0.020992888344658747
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,8192,128,0.0032017777363459268
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,8192,256,0.020543111695183646
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,8192,256,0.011741333537631564
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,8192,64,0.002806222273243798
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,8192,32,0.003170666595300039
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,8192,128,0.011191999746693505
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,8192,128,0.01791111131509145
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,8192,64,0.011515555282433828
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,8192,32,0.011705777711338468
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,7168,65536,0.1564133299721612
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,7168,65536,0.10919111304812962
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,7168,51200,0.12492356035444473
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,7168,51200,0.08667200141482884
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,7168,16384,0.0469760000705719
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,8192,1536,0.007928888830873702
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,7168,16384,0.03642755415704515
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,7168,12288,0.03707733419206407
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,8192,2560,0.030623998906877305
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,7168,16384,0.06112888786527845
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,7168,10240,0.02868088748719957
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,7168,12288,0.029834667841593426
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,7168,8192,0.024579554796218872
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,7168,10240,0.027071999178992376
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,7168,12288,0.05156533254517449
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,7168,10240,0.04747200012207031
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,7168,7168,0.021366222037209406
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,7168,51200,0.13828178246816
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,7168,65536,0.1716995504167345
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,7168,8192,0.023461333579487268
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,7168,6144,0.018971555762820773
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,7168,8192,0.04309511184692383
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,7168,7168,0.02129688858985901
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,7168,5120,0.01625688870747884
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,7168,7168,0.040720889965693154
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,7168,4096,0.014135110709402295
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,7168,6144,0.020111999577946134
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,7168,6144,0.038104888465669416
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,7168,3584,0.012410666379663678
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,7168,5120,0.01871466636657715
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,7168,5120,0.03569333420859443
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,7168,3072,0.011230222052998014
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,7168,4096,0.03336355421278212
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,7168,3584,0.01716088917520311
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,7168,3584,0.032776888873842024
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,7168,2560,0.009691555466916826
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,7168,2048,0.008897778060701158
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,7168,3072,0.031325333648257785
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,7168,2560,0.015462223026487561
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,7168,2048,0.028657777441872492
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,7168,1536,0.0074515557951397365
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,7168,2048,0.01443822185198466
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,7168,1024,0.005628444254398346
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,7168,1536,0.025467554728190105
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,7168,1536,0.013079110946920184
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,7168,768,0.0052533331844541765
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,7168,1024,0.012445333103338877
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,7168,1024,0.023383999864260357
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,7168,512,0.0038808890514903595
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,7168,768,0.023023999399609033
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,7168,768,0.012113778127564324
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,7168,256,0.003549333247873518
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,7168,512,0.011746666497654386
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,7168,512,0.02126577827665541
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,7168,128,0.003157333367400699
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,7168,256,0.011142222417725457
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,7168,256,0.01971733404530419
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,7168,64,0.003165333428316646
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,7168,128,0.018990221950742934
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,7168,32,0.0028719999310043124
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,7168,64,0.01107377807299296
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,7168,4096,0.017571555243598092
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,7168,32,0.011414222419261932
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,7168,3072,0.016546666622161865
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,7168,2560,0.03118577930662367
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,6144,65536,0.10168621937433879
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,6144,51200,0.10778577460183038
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,6144,16384,0.03908711009555393
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,6144,51200,0.08043911059697469
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,6144,16384,0.0348293317688836
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,6144,12288,0.03165155649185181
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,6144,16384,0.060645335250430636
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,6144,12288,0.028021332290437486
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,6144,65536,0.17071821954515246
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,6144,51200,0.13796444733937582
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,6144,10240,0.02737599942419264
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,6144,12288,0.05145244465933906
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,6144,8192,0.022843556271659002
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,7168,128,0.011083555718262991
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,6144,10240,0.025352888637118872
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,6144,7168,0.020573332905769348
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,6144,10240,0.04754933383729723
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,6144,8192,0.022338666849666174
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,6144,6144,0.015498666299713982
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,6144,7168,0.02057422200838725
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,6144,7168,0.040082666609022356
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,6144,65536,0.1349831157260471
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,6144,5120,0.013769778112570444
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,6144,6144,0.019388443893856473
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,6144,6144,0.03684711125161912
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,6144,4096,0.011952888634469775
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,6144,5120,0.018191110756662156
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,6144,5120,0.035657776726616755
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,6144,3584,0.010653333531485664
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,6144,4096,0.016719111137919955
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,6144,4096,0.03384800089730157
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,6144,3072,0.009892444643709395
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,6144,3584,0.0162444445821974
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,6144,3584,0.03172533379660712
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,6144,2560,0.008621333373917473
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,6144,3072,0.01629066632853614
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,6144,2048,0.007679999702506595
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,6144,2560,0.015000889698664347
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,6144,2560,0.03062844607565138
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,6144,1536,0.006245333287451003
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,6144,2048,0.013458666702111563
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,6144,2048,0.028419554233551025
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,6144,1024,0.004642666627963384
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,6144,1536,0.013069333301650153
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,6144,1536,0.02605244517326355
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,6144,768,0.004202666795916027
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,6144,1024,0.012448000411192576
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,6144,512,0.0035413333939181436
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,6144,768,0.012437333663304647
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,6144,8192,0.042509333954917065
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,6144,256,0.003277333246337043
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,6144,512,0.021967111362351313
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,6144,256,0.011401777466138205
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,6144,128,0.0032026666320032547
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,6144,256,0.02104266650146908
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,6144,128,0.0195795562532213
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,6144,128,0.011076444553004371
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,6144,64,0.0031617778456873367
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,6144,32,0.003068444422549672
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,6144,3072,0.03047555685043335
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,6144,64,0.011400000088744693
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,5120,65536,0.11565689245859782
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,6144,32,0.01202755586968528
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,5120,51200,0.09205510881212021
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,5120,65536,0.09525155358844334
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,5120,51200,0.07380711370044284
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,5120,16384,0.035242666800816856
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,6144,1024,0.023525334066814844
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,5120,16384,0.03234400020705329
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,5120,12288,0.027621333797772724
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,5120,16384,0.059748444292280406
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,6144,768,0.0229751103454166
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,5120,10240,0.02368800010946062
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,5120,12288,0.025752888785468206
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,6144,512,0.012081777883900536
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,5120,12288,0.05062133404943678
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,5120,65536,0.169995559586419
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,5120,10240,0.02310133311483595
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,5120,51200,0.13714667161305746
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,5120,7168,0.018192888961897958
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,5120,10240,0.046669334173202515
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,5120,6144,0.016826666063732572
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,5120,8192,0.04211733407444424
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,5120,8192,0.02126844392882453
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,5120,7168,0.019816888703240287
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,5120,5120,0.014114666316244336
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,5120,7168,0.0403457780679067
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,5120,4096,0.012699555191728802
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,5120,6144,0.03811555438571506
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,5120,5120,0.01756622228357527
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,5120,5120,0.03558844327926636
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,5120,4096,0.032842665910720825
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,5120,4096,0.0166275550921758
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,5120,3072,0.010425777898894416
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,5120,3584,0.03162755568822225
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,5120,2560,0.008799999952316284
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,5120,3072,0.030051555898454454
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,5120,2560,0.013741333451535968
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,5120,2560,0.030264000097910564
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,5120,2048,0.007711110843552484
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,5120,2048,0.013440888788965015
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,5120,2048,0.026737777723206416
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,5120,1536,0.006171555568774541
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,5120,1536,0.012727110750145383
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,5120,1536,0.02474133339193132
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,5120,1024,0.004583111239804162
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,5120,8192,0.019916445016860962
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,5120,768,0.0038951109680864546
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,5120,1024,0.012392000191741519
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,5120,6144,0.018532445033391316
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,5120,768,0.02295111119747162
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,5120,512,0.0038417776425679526
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,5120,3584,0.01109155515829722
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,5120,256,0.0032044444233179092
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,5120,512,0.021943999661339655
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,5120,3584,0.016207999653286405
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,5120,256,0.01186044431395001
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,5120,128,0.002883555574549569
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,5120,256,0.020230222079488967
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,5120,3072,0.014819555812411837
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,5120,64,0.003142222141226133
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,5120,128,0.01924000018172794
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,5120,128,0.011748444702890186
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,5120,32,0.003010666618744532
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,5120,64,0.011038222246699862
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,4096,65536,0.09195999966727363
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,5120,32,0.012096000214417776
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,4096,51200,0.0732133322291904
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,4096,65536,0.08626755740907456
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,4096,51200,0.0706862211227417
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,5120,1024,0.023431999815834895
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,4096,16384,0.028733332951863606
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,5120,768,0.012075555821259817
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,4096,16384,0.02997244397799174
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,4096,12288,0.022787556052207947
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,4096,65536,0.16915288236406115
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,4096,51200,0.13728266292148167
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,4096,10240,0.019951999187469482
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,5120,512,0.011941333611806234
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,4096,16384,0.06051644351747301
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,4096,12288,0.02419288953145345
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,4096,8192,0.0174319992462794
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,4096,12288,0.0510168903403812
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,4096,7168,0.015786666009161208
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,4096,10240,0.021592888567182753
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,4096,8192,0.02058844433890449
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,4096,6144,0.014016888207859464
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,4096,8192,0.041913777589797974
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,4096,7168,0.018883556127548218
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,4096,7168,0.03979644510481093
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,4096,6144,0.03598755598068237
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,4096,4096,0.0105253333846728
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,4096,5120,0.035255998373031616
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,4096,5120,0.01702222228050232
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,4096,3584,0.008960000342792934
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,4096,4096,0.03244888782501221
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,4096,3584,0.01477777792347802
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,4096,3072,0.008257778154479133
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,4096,3584,0.03139822350607978
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,4096,3072,0.02810133496920268
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,4096,3072,0.014135999812020196
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,4096,2560,0.007298666569921706
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,4096,2560,0.013396444420019785
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,4096,2048,0.006287999865081575
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,4096,2048,0.013060444758998023
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,4096,10240,0.046915554338031344
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,4096,1536,0.00527022240890397
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,4096,2048,0.026762665973769292
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,4096,5120,0.011067555182509951
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,4096,1024,0.00424799985355801
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,4096,6144,0.018200889229774475
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,4096,1536,0.0127368892232577
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,4096,1536,0.026036444637510512
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,4096,768,0.0038488888078265717
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,4096,1024,0.01239822225438224
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,4096,1024,0.024057777391539678
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,4096,512,0.003685333248641756
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,4096,4096,0.015413333972295126
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,4096,768,0.023638221952650283
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,4096,768,0.012082666986518435
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,4096,256,0.0032097777972618737
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,4096,128,0.0031022222505675424
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,4096,512,0.012093333734406365
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,4096,512,0.020989333589871723
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,4096,256,0.020756444997257657
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,4096,64,0.002854222224818336
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,4096,256,0.011375111010339526
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,4096,32,0.002879111096262932
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,4096,128,0.011071999867757162
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,4096,128,0.01990133358372582
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,4096,64,0.010738666686746808
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,3584,65536,0.0792906681696574
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,4096,32,0.012090666426552666
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,3584,51200,0.0633760028415256
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,3584,16384,0.025217778152889673
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,3584,65536,0.08602755599551731
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,4096,2560,0.028083556228213843
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,3584,12288,0.019949333535300363
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,3584,51200,0.06648088826073541
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,3584,16384,0.02755644420782725
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,3584,10240,0.017553778158293832
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,3584,16384,0.05948533614476522
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,3584,12288,0.023471999499532912
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,3584,8192,0.015352000792821249
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,3584,12288,0.0506568882200453
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,3584,10240,0.021191999316215515
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,3584,10240,0.046345776981777616
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,3584,65536,0.16890845033857557
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,3584,51200,0.1377626657485962
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,3584,6144,0.013099555340078143
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,3584,8192,0.019952888290087383
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,3584,8192,0.04211022125350105
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,3584,5120,0.010675555302037133
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,3584,7168,0.01852799952030182
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,3584,7168,0.03969600134425693
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,3584,6144,0.01756977703836229
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,3584,4096,0.009944000177913243
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,3584,6144,0.036100443866517805
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,3584,3584,0.008642666869693333
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,3584,5120,0.016889777448442247
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,3584,5120,0.03520355621973673
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,3584,3072,0.00797333319981893
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,3584,4096,0.032459557056427
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,3584,3584,0.03058755397796631
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,3584,3584,0.014160000615649752
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,3584,2560,0.0068959999415609576
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,3584,3072,0.013759111364682516
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,3584,3072,0.028629332780838013
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,3584,2048,0.0059262220230367445
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,3584,2560,0.013411555853154926
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,3584,2560,0.027740443746248882
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,3584,1536,0.005260444349712796
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,3584,2048,0.012776888906955719
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,3584,2048,0.026280000805854797
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,3584,1024,0.004226666771703296
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,3584,1536,0.01277955538696713
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,3584,1536,0.025019556283950806
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,3584,768,0.003653333418899112
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,3584,1024,0.012144000165992312
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,3584,1024,0.0233324451578988
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,3584,512,0.003556444413132138
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,3584,768,0.01204622205760744
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,3584,256,0.0032337777730491427
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,3584,512,0.021108445194032457
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,3584,512,0.011712888876597086
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,3584,128,0.00300177786913183
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,3584,7168,0.014073777529928418
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,3584,256,0.011376889215575324
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,3584,256,0.0196142229768965
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,3584,64,0.0028862222615215513
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,3584,32,0.0028417776856157514
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,3584,128,0.011379555695586734
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,3584,128,0.019222221440739103
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,3584,64,0.01069777790043089
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,3072,65536,0.06946755780114068
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,3584,32,0.010701333483060202
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,3584,4096,0.015119999647140503
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,3072,51200,0.05574933025572035
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,3072,65536,0.08354222112231785
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,3072,16384,0.02113866640461816
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,3072,51200,0.06674844688839383
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,3072,16384,0.02693333393997616
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,3072,16384,0.059895998901791044
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,3072,12288,0.022616000639067754
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,3072,51200,0.13721156120300293
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,3072,10240,0.015618667006492615
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,3072,12288,0.050385776493284434
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,3072,8192,0.01352355546421475
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,3072,10240,0.02086666723092397
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,3584,768,0.022996443841192458
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,3072,7168,0.012936000194814471
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,3072,8192,0.01965777741538154
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,3072,8192,0.04162222146987915
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,3072,6144,0.012073777616024017
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,3072,7168,0.01846844454606374
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,3072,7168,0.040158222119013466
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,3072,5120,0.01033866653839747
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,3072,6144,0.017157332764731515
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,3072,6144,0.037343111303117536
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,3072,4096,0.009457777771684859
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,3072,5120,0.01677955521477593
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,3072,5120,0.03535822365019057
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,3072,3584,0.008425777984990014
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,3072,4096,0.015272888872358533
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,3072,4096,0.03122133347723219
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,3072,3072,0.00759733302725686
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,3072,3584,0.014485332700941296
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,3072,12288,0.018017777138286166
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,3072,3584,0.03228088882234361
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,3072,2560,0.007044444481531779
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,3072,3072,0.014096889230940076
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,3072,3072,0.027792887555228338
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,3072,2048,0.006241777704821692
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,3072,2560,0.013433777623706393
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,3072,65536,0.16848356193966338
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,3072,2560,0.027064889669418335
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,3072,1536,0.005219555563396878
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,3072,1024,0.0039048890272776284
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,3072,2048,0.02720355490843455
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,3072,2048,0.012735111018021902
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,3072,768,0.003628444340493944
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,3072,1536,0.012422222230169507
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,3072,10240,0.04619288775655958
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,3072,1024,0.023969777756267126
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,3072,1024,0.012288000020715924
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,3072,512,0.00350577798154619
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,3072,256,0.003160888950030009
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,3072,768,0.02274399995803833
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,3072,768,0.011764444410800934
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,3072,128,0.0029200000895394217
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,3072,512,0.022613333331214056
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,3072,512,0.01203555530971951
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,3072,64,0.0026008888251251644
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,3072,256,0.011145778000354767
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,3072,32,0.0028719999310043124
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,3072,128,0.011143999795118967
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,3072,64,0.011370666325092316
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,2560,65536,0.05940000216166178
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,3072,32,0.011046222514576383
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,2560,51200,0.04751733276579115
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,2560,65536,0.08141333527035184
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,2560,51200,0.064538664287991
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,2560,16384,0.019592000378502738
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,2560,65536,0.16893777582380506
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,2560,51200,0.13759556081559923
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,2560,16384,0.025967111190160114
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,2560,12288,0.016972444123691983
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,2560,16384,0.05888444185256958
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,3072,1536,0.024703111913469102
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,2560,10240,0.014818666709793938
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,2560,12288,0.05027733246485392
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,2560,10240,0.04593244526121351
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,2560,10240,0.020630222227838304
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,2560,8192,0.012434666355450949
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,2560,7168,0.012255111502276527
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,3072,256,0.019546666079097323
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,2560,8192,0.04173422190878126
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,3072,128,0.019689778486887615
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,2560,6144,0.01108888867828581
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,2560,7168,0.018239999810854595
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,2560,7168,0.039447112215889826
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,2560,5120,0.010032888915803697
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,2560,6144,0.017107556263605755
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,2560,6144,0.03601333167817857
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,2560,4096,0.009014222357008193
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,2560,5120,0.03457511133617825
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,2560,5120,0.015526221858130561
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,2560,3584,0.008277333445019191
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,2560,4096,0.03148444493611654
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,2560,4096,0.01479466590616438
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,2560,3072,0.007344000041484833
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,2560,3584,0.029498666524887085
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,2560,2560,0.006748444504208035
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,2560,3072,0.029110223054885864
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,2560,3072,0.013491555220550962
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,2560,2048,0.006292444550328785
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,2560,2560,0.027405333187845018
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,2560,2560,0.013419555293189155
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,2560,1536,0.0047866664826869965
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,2560,2048,0.012746666868527731
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,2560,2048,0.02642311155796051
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,2560,12288,0.022117333279715642
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,2560,1024,0.0041884444653987885
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,2560,1536,0.012778666284349231
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,2560,768,0.003548444559176763
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,2560,1024,0.023686221904224817
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,2560,1024,0.012099555797047086
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,2560,512,0.003536888708670934
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,2560,768,0.01204533295498954
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,2560,8192,0.01899111105336083
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,2560,256,0.003156444471743372
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,2560,768,0.023021333747439917
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,2560,512,0.011721777419249216
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,2560,128,0.002850666642189026
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,2560,256,0.020968000094095867
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,2560,256,0.011377777490350934
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,2560,64,0.0026488889836602737
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,2560,128,0.019554666346973844
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,2560,128,0.011058666639857821
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,2560,32,0.0028106667515304354
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,2560,64,0.010856000085671743
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,2048,65536,0.048727999130884804
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,2560,3584,0.013805333111021252
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,2560,32,0.011365333365069495
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,2048,51200,0.03882666760020786
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,2048,65536,0.07808266745673285
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,2048,16384,0.017200888858901132
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,2048,51200,0.06263999806510077
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,2048,65536,0.16854133870866564
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,2048,16384,0.025702221526039973
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,2048,16384,0.058607108063168
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,2048,51200,0.1374382177988688
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,2560,1536,0.024724443753560383
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,2048,12288,0.01497333414024777
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,2048,10240,0.013785777820481194
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,2048,8192,0.01275022245115704
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,2048,12288,0.021617778473430212
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,2048,10240,0.020232889387342665
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,2048,7168,0.01201777739657296
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,2048,8192,0.018251554833518136
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,2048,8192,0.04145244426197476
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,2048,6144,0.010935111178292168
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,2560,512,0.021958221991856892
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,2048,5120,0.010176888770527309
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,2048,7168,0.03843377696143256
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,2048,6144,0.016528889536857605
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,2048,6144,0.036828445063696966
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,2048,4096,0.008425777984990014
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,2048,5120,0.03382844395107693
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,2048,5120,0.015485333071814643
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,2048,3584,0.007715555528799693
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,2048,4096,0.014485332700941296
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,2048,3072,0.00701155596309238
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,2048,3584,0.014098667436175875
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,2048,3072,0.013769778112570444
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,2048,3072,0.028132445282406274
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,2048,2560,0.006247111078765657
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,2048,2560,0.028452446063359577
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,2048,2048,0.005229333208666907
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,2048,12288,0.04957955413394504
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,2048,2048,0.013095999757448832
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,2048,10240,0.0458497769302792
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,2048,1536,0.004854222138722737
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,2048,2048,0.027090667022599116
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,2048,1536,0.012720000412729053
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,2048,1536,0.02539199921819899
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,2048,1024,0.0041582224269707995
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,2048,1024,0.023680888944202002
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,2048,1024,0.01240799989965227
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,2048,768,0.0036728887094391715
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,2048,4096,0.030481778913074072
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,2048,512,0.003510222252872255
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,2048,3584,0.029042667812771265
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,2048,768,0.023285332653257582
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,2048,256,0.0029964444951878656
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,2048,512,0.011752000285519494
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,2048,512,0.021086222595638696
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,2048,128,0.002834666727317704
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,2048,256,0.01168444421556261
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,2048,256,0.019666666785875957
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,2048,2560,0.013345777988433838
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,2048,64,0.0026462222966882917
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,2048,128,0.01107911103301578
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,2048,128,0.01962222158908844
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,1536,65536,0.037017779217825994
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,2048,64,0.011378666592968835
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,2048,32,0.011262222296661802
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,1536,51200,0.03067644437154134
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,1536,65536,0.0735608869128757
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,2048,7168,0.01753777762254079
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,1536,65536,0.16928888691796196
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,1536,16384,0.015339555011855232
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,1536,51200,0.1377262274424235
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,1536,16384,0.025428444147109985
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,1536,16384,0.05828444163004557
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,1536,12288,0.01308444473478529
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,1536,10240,0.013055110971132914
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,2048,768,0.012123555772834353
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,1536,12288,0.049582223097483315
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,1536,12288,0.021906667285495337
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,1536,8192,0.012278222375445895
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,1536,10240,0.019677332705921598
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,1536,10240,0.04632088873121473
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,1536,7168,0.011003555523024665
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,1536,8192,0.01739555597305298
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,1536,8192,0.04037244452370538
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,1536,6144,0.010337777435779572
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,1536,7168,0.038541333542929754
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,1536,7168,0.016895999511082966
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,2048,32,0.002833777831660377
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,1536,5120,0.009949333137936061
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,1536,6144,0.0355422231886122
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,1536,4096,0.00905955582857132
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,1536,5120,0.01566755606068505
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,1536,3584,0.007286222444640265
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,1536,4096,0.03117777903874715
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,1536,4096,0.014195554786258273
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,1536,3072,0.007119999991522894
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,1536,3584,0.030078222354253132
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,1536,3584,0.014137778017255994
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,1536,2560,0.006204444501135085
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,1536,51200,0.06086755461162991
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,1536,3072,0.01370666672786077
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,1536,3072,0.02808711263868544
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,1536,2048,0.005260444349712796
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,1536,1536,0.004608889006906086
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,1536,2560,0.027408889598316614
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,1536,2560,0.013450666434235044
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,1536,1024,0.0039057777159743835
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,1536,2048,0.012792000340090858
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,1536,2048,0.02572444412443373
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,1536,768,0.003519111209445529
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,1536,1536,0.012425777812798819
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,1536,1536,0.026092444856961567
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,1536,512,0.0031519999934567344
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,1536,1024,0.024345777100986902
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,1536,1024,0.012432888978057437
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,1536,256,0.00319377767542998
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,1536,768,0.011894221935007306
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,1536,512,0.021653332644038733
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,1536,128,0.0028400001012616684
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,1536,256,0.020227554771635268
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,1536,256,0.011759999725553723
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,1536,64,0.0028844444702068963
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,1536,128,0.018882667024930317
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,1536,128,0.011711999773979187
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,1536,32,0.00281866660548581
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,1536,6144,0.015565334094895257
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,1024,65536,0.02642400066057841
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,1536,32,0.011707555916574268
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,1024,51200,0.024725332856178284
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,1024,65536,0.07266666491826375
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,1024,65536,0.1695093313852946
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,1024,51200,0.05704710880915324
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,1024,16384,0.012430222498046027
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,1024,51200,0.13707555664910212
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,1024,12288,0.012260444462299347
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,1024,16384,0.05848889218436348
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,1024,16384,0.025034666061401367
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,1024,10240,0.010999999940395355
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,1024,12288,0.020231111182106864
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,1024,12288,0.04890133274926079
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,1536,768,0.022681777675946552
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,1024,8192,0.01000355515215132
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,1536,512,0.011699555648697747
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,1024,10240,0.04458666510052151
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,1024,10240,0.018312000566058688
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,1024,7168,0.009375111096435124
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,1024,8192,0.03990666733847724
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,1024,6144,0.008800889054934183
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,1024,7168,0.0376506679587894
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,1536,64,0.011124444504578909
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,1024,5120,0.008959111240175035
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,1024,6144,0.015480000111791821
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,1024,6144,0.033837334977255926
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,1536,5120,0.033386667569478355
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,1024,4096,0.007616000043021307
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,1024,5120,0.01520088811715444
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,1024,5120,0.032495998673968844
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,1024,3584,0.006940444310506185
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,1024,4096,0.030533333619435627
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,1024,3072,0.006228444476922353
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,1024,3584,0.013811555173661975
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,1024,3584,0.029662221670150757
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,1024,2560,0.0059004442559348206
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,1024,3072,0.013396444420019785
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,1024,3072,0.028781334559122723
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,1024,2048,0.0052177777720822235
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,1024,2560,0.013367111484209696
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,1024,2560,0.026408889227443274
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,1024,1536,0.004593777573770947
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,1024,2048,0.012783110969596438
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,1024,2048,0.027165333429972332
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,1024,1024,0.00388711111413108
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,1024,1536,0.012441777520709567
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,1024,1536,0.025958221819665697
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,1024,768,0.003834666477309333
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,1024,1024,0.012447111308574677
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,1024,8192,0.01683555543422699
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,1024,512,0.0035146665241983202
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,1024,7168,0.016155555844306946
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,1024,768,0.012048888537618848
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,1024,768,0.023617777559492324
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,1024,256,0.0032106666929192017
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,1024,512,0.021560000048743352
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,1024,512,0.011723555624485016
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,1024,128,0.0028684443483750024
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,1024,256,0.020907556017239887
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,1024,256,0.011732444167137146
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,1024,64,0.0028640000770489373
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,1024,32,0.00282577777074443
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,1024,128,0.018231110440360177
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,1024,128,0.011032889286677042
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,1024,4096,0.014087110757827759
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,768,65536,0.025403555896547105
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,1024,64,0.011036444041464063
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,768,51200,0.02106399999724494
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,1024,32,0.011370666325092316
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,768,65536,0.06884977552625868
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,768,51200,0.055863108899858266
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,768,65536,0.16889333724975586
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,768,51200,0.13645688692728677
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,768,12288,0.010508444574144153
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,768,16384,0.023875556058353845
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,768,10240,0.010072888599501716
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,768,16384,0.05837955739763048
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,768,12288,0.019895111521085102
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,768,12288,0.048244443204667836
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,768,8192,0.009375111096435124
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,768,10240,0.017903111047214933
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,768,10240,0.045399109522501625
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,768,7168,0.008631111019187504
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,768,6144,0.008281778130266402
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,768,8192,0.03901777664820353
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,1024,1024,0.023342221975326538
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,768,5120,0.008330666356616551
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,768,7168,0.016840888394249808
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,768,7168,0.03701511025428772
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,768,4096,0.007469333708286285
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,768,6144,0.03337422344419692
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,768,6144,0.015508444772826301
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,768,3584,0.00703288863102595
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,768,5120,0.033583111233181424
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,768,5120,0.014596444037225513
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,768,3072,0.006281777802440856
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,768,4096,0.013754666679435305
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,768,4096,0.030469334787792627
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,768,2560,0.005592000153329637
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,768,3584,0.013768889009952545
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,768,3072,0.027414222558339436
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,768,3072,0.013183111117945777
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,768,2048,0.004881777697139316
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,768,2560,0.013064000341627332
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,768,1536,0.004535111288229625
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,768,2048,0.012717333104875354
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,768,2048,0.02605688903066847
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,768,1024,0.0038417776425679526
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,768,1536,0.01237777786122428
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,768,1536,0.024738666084077623
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,768,768,0.0035173334181308746
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,768,1024,0.011756444142924415
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,768,1024,0.022683555881182354
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,768,768,0.011741333537631564
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,768,768,0.02199555602338579
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,768,512,0.0032337777730491427
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,768,8192,0.016895999511082966
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,768,256,0.0028897778441508612
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,768,512,0.02092355489730835
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,768,256,0.011384888655609555
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,768,128,0.002826666666401757
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,768,3584,0.029482665989134047
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,768,128,0.011086222198274402
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,768,64,0.00254844439526399
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,768,128,0.01959111127588484
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,768,2560,0.02720355490843455
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,768,32,0.002858666703104973
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,768,64,0.010693333215183683
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,768,16384,0.012068444656001197
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,768,32,0.01107377807299296
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,512,51200,0.018336888816621568
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,512,65536,0.06799911128150092
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,512,65536,0.16814933882819283
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,512,16384,0.01071466671095954
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,512,51200,0.05551111035876804
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,512,51200,0.13638667265574136
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,512,12288,0.008868444297048781
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,512,16384,0.023289778166347083
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,512,16384,0.056813332769605845
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,512,10240,0.009308444129096137
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,768,512,0.011431111229790581
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,512,12288,0.019550222489568923
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,512,12288,0.04755289024776883
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,512,8192,0.008309333688682979
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,512,10240,0.018183110488785636
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,768,256,0.01939022209909227
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,512,10240,0.043394668234719165
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,512,7168,0.007990222010347579
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,512,6144,0.008619555168681675
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,512,8192,0.01701244380739
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,512,8192,0.03901777664820353
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,512,7168,0.03669955664210849
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,512,7168,0.015847999188635085
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,512,6144,0.015108444624476962
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,512,6144,0.03472800056139628
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,512,4096,0.007312888900438945
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,512,5120,0.032165331972969904
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,512,5120,0.014486221803559197
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,512,3584,0.006979555719428592
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,512,65536,0.02168888847033183
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,512,4096,0.029839111698998347
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,512,3072,0.006884444504976273
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,512,3584,0.013450666434235044
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,512,2560,0.0058808889653947614
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,512,3072,0.013166222307417126
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,512,3072,0.02828888760672675
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,512,2048,0.004893333133724001
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,512,2560,0.012739555703269111
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,512,2560,0.027106665902667578
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,512,1536,0.004522666749027041
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,512,2048,0.012832000023788877
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,512,2048,0.025085333320829604
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,512,1024,0.0038613333470291565
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,512,1536,0.012362666428089142
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,512,1536,0.025389333566029865
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,512,768,0.0035982223020659555
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,512,1024,0.011731555892361535
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,512,1024,0.023333332604832117
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,512,512,0.003177777760558658
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,512,768,0.012085333466529846
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,512,768,0.022298667165968154
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,512,256,0.0031679999083280563
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,512,5120,0.007987555530336168
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,512,512,0.011439111497667102
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,512,512,0.022200889057583276
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,512,128,0.00286666676402092
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,512,256,0.019274666905403137
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,512,256,0.011077333655622272
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,512,64,0.002510222295920054
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,512,32,0.0028284444577164124
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,512,128,0.011730666789743634
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,256,65536,0.01519466605451372
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,512,4096,0.014146667387750415
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,256,51200,0.013732444081041547
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,512,3584,0.028480887413024902
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,512,32,0.011014222270912595
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,256,16384,0.009718221922715506
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,256,65536,0.066557334529029
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,256,65536,0.1673848893907335
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,256,51200,0.05388444330957201
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,256,12288,0.01000711073478063
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,256,51200,0.1357768906487359
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,256,16384,0.022689777943823073
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,256,16384,0.056382218996683754
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,256,10240,0.008970666262838576
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,256,8192,0.008283555507659912
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,256,12288,0.04686489038997226
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,256,12288,0.01992266707950168
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,256,7168,0.00794933322403166
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,256,10240,0.04363644454214308
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,256,10240,0.018208000395033095
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,256,8192,0.01647733317481147
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,256,8192,0.03868088788456387
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,256,6144,0.0073831114504072405
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,256,7168,0.03766311208407084
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,256,7168,0.016196444630622864
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,256,5120,0.0069724445541699724
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,256,6144,0.015145777000321282
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,256,6144,0.033944000800450645
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,256,4096,0.006813333266311222
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,256,5120,0.014752000570297241
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,256,5120,0.03356711069742838
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,256,3584,0.006384000182151794
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,256,4096,0.013764444324705334
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,256,4096,0.030159112479951646
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,256,3072,0.006646222124497096
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,256,3584,0.014108444253603617
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,512,128,0.01789066692193349
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,256,2560,0.006616888774765863
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,256,3072,0.013080889152155982
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,256,3072,0.027388445205158655
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,256,2048,0.006024888820118374
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,512,64,0.011400000088744693
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,256,2560,0.02847111225128174
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,256,2560,0.012827555338541666
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,256,1536,0.004519999855094486
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,256,1024,0.003842666745185852
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,256,2048,0.025360888904995386
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,256,2048,0.012440000143316058
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,256,768,0.00351200004418691
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,256,1536,0.024485333098305598
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,256,1024,0.022642667094866436
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,256,1024,0.012441777520709567
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,256,512,0.003154666680428717
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,256,768,0.022664000590642292
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,256,256,0.0031600000543726813
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,256,512,0.012088889049159156
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,256,512,0.021329777108298406
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,256,128,0.00281866660548581
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,256,256,0.01109333336353302
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,256,256,0.020609777834680345
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,256,64,0.002550222186578645
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,256,128,0.01072533345884747
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,256,32,0.002489777695801523
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,256,64,0.011208000282446543
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,128,65536,0.01514488955338796
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,256,32,0.010399999717871347
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,256,3584,0.029820445511076186
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,128,51200,0.014781332678265043
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,128,65536,0.06360177861319648
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,128,65536,0.16724622249603271
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,128,16384,0.008977777428097194
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,128,51200,0.051111999485227794
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,128,51200,0.13543200492858887
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,128,12288,0.00793688909875022
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,128,16384,0.02274133265018463
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,256,1536,0.012748444245921241
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,128,16384,0.0557733310593499
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,128,10240,0.007283555964628856
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,128,12288,0.04688533478313022
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,128,12288,0.019898666275872123
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,128,8192,0.007269333634111617
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,128,10240,0.0439226660463545
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,128,10240,0.018200000127156574
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,128,7168,0.006677333265542984
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,128,8192,0.016882666283183627
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,128,8192,0.038711110750834145
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,128,6144,0.006288888967699475
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,128,7168,0.03738222188419766
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,128,5120,0.006270222365856171
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,256,128,0.017856000198258292
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,128,6144,0.015101333459218344
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,128,6144,0.035038222869237266
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,128,4096,0.006236444330877728
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,128,5120,0.015139554937680563
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,128,5120,0.03228444523281521
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,128,3584,0.006249777972698212
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,128,4096,0.014110222458839417
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,128,3072,0.006029333505365584
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,128,3584,0.013423110875818463
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,128,3584,0.029489778810077246
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,128,2560,0.006322666588756774
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,128,3072,0.013447999954223633
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,128,3072,0.027447111076778833
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,128,2048,0.005598222215970357
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,128,2560,0.013445333474212222
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,128,2560,0.028096887800428603
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,128,1536,0.004521777646409141
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,128,2048,0.01240799989965227
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,128,2048,0.027101332942644756
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,128,1024,0.0038746665749284956
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,256,768,0.011492444409264458
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,128,1536,0.01256533298227522
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,128,768,0.00350222239891688
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,128,1024,0.02437155610985226
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,128,1024,0.011769777370823754
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,128,512,0.0031591111587153543
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,128,768,0.02257777750492096
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,128,256,0.003154666680428717
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,128,7168,0.0162453336848153
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,128,512,0.022092445029152766
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,128,512,0.011386666860845355
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,128,128,0.0025315555847353404
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,128,256,0.020978666014141504
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,128,256,0.01092355532778634
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,128,64,0.002485333424475458
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,128,128,0.01072533345884747
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,128,128,0.019542222221692402
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,128,32,0.002485333424475458
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,64,65536,0.012104888757069906
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,128,4096,0.030477331744299993
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,64,51200,0.01091466678513421
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,128,32,0.011374221907721626
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,64,16384,0.008285333712895712
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,64,65536,0.06334577666388617
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,64,12288,0.007601777712504069
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,64,51200,0.05113244387838575
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,64,10240,0.007072889142566257
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,64,16384,0.02299022177855174
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,64,8192,0.006963555183675554
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,64,12288,0.01959288948112064
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,64,7168,0.006586666736337874
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,64,8192,0.01687111126052009
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,48,128,1536,0.024401777320437964
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,64,7168,0.016030222177505493
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,64,5120,0.005946666830115848
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,128,768,0.012060444388124677
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,64,6144,0.01515111161602868
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,64,4096,0.00591111100382275
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,64,3584,0.00630666646692488
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,64,5120,0.014502222339312235
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,64,3072,0.005596444424655702
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,64,4096,0.013753777576817406
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,64,3584,0.01408622165520986
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,64,3072,0.01313244468635983
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,64,2048,0.005566222386227713
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,128,64,0.010354667074150508
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,64,2560,0.01312622262371911
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,64,1536,0.00453333349691497
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,64,1024,0.0035422220826148987
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,64,2048,0.01273155543539259
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,64,1536,0.012401777837011548
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,64,1024,0.011763555308183035
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,64,512,0.0031591111587153543
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,64,768,0.012058667010731168
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,64,256,0.00299822228650252
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,64,512,0.01143200033240848
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,64,10240,0.017893332574102614
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,64,128,0.0025253333151340485
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,64,64,0.002465777720014254
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,64,256,0.011423110961914062
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,64,6144,0.006618666566080517
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,64,32,0.002526222210791376
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,64,128,0.010682666467295753
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,32,65536,0.012083555261294046
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,64,64,0.010321777727868822
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,32,51200,0.011085333095656501
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,32,16384,0.007990222010347579
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,32,65536,0.06281599733564588
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,32,51200,0.05043111244837443
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,32,12288,0.0069360000391801195
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,32,16384,0.02325511144267188
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,32,10240,0.006912888752089606
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,64,2560,0.005897777775923411
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,32,8192,0.0064204442832205035
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,32,7168,0.006256888724035687
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,32,12288,0.01956977778010898
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,32,10240,0.018200000127156574
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,32,6144,0.006292444550328785
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,32,8192,0.01647822227742937
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,32,5120,0.005943999936183293
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,32,7168,0.015790222419632804
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,32,4096,0.00565422202150027
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,32,3584,0.005572444448868434
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,32,6144,0.015459555718633862
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,64,768,0.0035013332962989807
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,32,5120,0.014474666780895658
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,32,2560,0.005881777654091517
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,32,4096,0.013747555514176687
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,32,3584,0.013471110827393003
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,32,2048,0.005559999909665849
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,32,1536,0.004511111312442356
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,32,3072,0.013192888763215808
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,32,1024,0.003863111138343811
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,32,2560,0.012890666723251343
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,32,768,0.003491555651028951
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,32,2048,0.01275199982855055
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,32,1536,0.012062222593360476
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,32,1024,0.011722666521867117
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,32,256,0.0028213332924577924
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,32,512,0.011379555695586734
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,32,128,0.0028168888141711554
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,64,32,0.011367110742463006
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,32,256,0.010704889065689512
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,32,64,0.002513777878549364
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,32,32,0.002481777841846148
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,32,128,0.010677333507272931
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,32,64,0.010404444403118556
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,32,32,0.011331555744012197
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,65536,16384,0.17553777164883086
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,65536,16384,0.3679537773132324
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,65536,51200,0.510117318895128
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,65536,12288,0.2719155682457818
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,32,512,0.003170666595300039
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,48,32,768,0.011697777443461947
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,65536,12288,0.13215466340382895
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,65536,10240,0.2288222312927246
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,65536,10240,0.1132791174782647
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,65536,51200,1.1211840311686199
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,65536,8192,0.18556622664133707
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,65536,8192,0.09706755479176839
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,65536,7168,0.1615333292219374
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,65536,7168,0.08358310990863377
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,65536,5120,0.11715377701653375
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,65536,6144,0.07438221904966566
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,65536,3584,0.0844693316353692
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,65536,4096,0.09539022048314412
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,65536,6144,0.13810400168100992
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,48,32,3072,0.005967111223273807
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,65536,5120,0.06413777669270833
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,65536,4096,0.05457866523000929
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,65536,3072,0.07236266798443265
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,65536,2560,0.06077422036064995
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,65536,3584,0.05720444520314535
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,65536,2048,0.05066133207745022
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,65536,1536,0.03889333208401998
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,65536,3072,0.05140799946255154
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,65536,2560,0.04537777768241035
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,65536,768,0.021292444732454088
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,65536,1536,0.031713777118259005
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,65536,2048,0.03986666599909464
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,65536,512,0.014767999450365702
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,65536,1024,0.025934222671720717
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,65536,768,0.02139555580086178
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,65536,256,0.00927022182279163
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,65536,128,0.006239999913507038
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,65536,64,0.006292444550328785
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,65536,512,0.01891288823551602
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,65536,32,0.006919999917348226
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,65536,256,0.01549600064754486
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,65536,128,0.014489778214030795
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,65536,64,0.016532444291644625
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,65536,32,0.01590488851070404
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,51200,16384,0.271488004260593
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,51200,65536,0.5406977865431044
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,51200,51200,0.41200889481438535
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,51200,16384,0.14214221636454263
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,51200,12288,0.20400088363223604
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,51200,12288,0.10857511228985256
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,51200,51200,0.8469333118862576
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,51200,10240,0.1716853380203247
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,51200,65536,1.0761537551879883
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,51200,8192,0.13877511024475098
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,51200,10240,0.09311022361119588
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,51200,7168,0.12334933545854355
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,51200,5120,0.08910044696595933
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,51200,6144,0.06230488750669691
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,51200,8192,0.08006578021579318
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,51200,3584,0.06422577963935004
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,51200,5120,0.0536444452073839
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,51200,4096,0.04607999987072415
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,51200,3072,0.056495110193888344
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,51200,3584,0.0484497778945499
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,51200,2560,0.04692622356944614
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,51200,3072,0.044191999567879565
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,51200,2048,0.03751111030578613
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,51200,1536,0.0302782224284278
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,51200,2560,0.03865866528617011
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,51200,2048,0.033928887711630926
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,51200,1024,0.02195288903183407
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,65536,1024,0.028885334730148315
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,51200,768,0.01638488968213399
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,51200,512,0.011699555648697747
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,51200,1536,0.027448000179396734
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,51200,256,0.007684444387753804
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,51200,1024,0.021839110387696162
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,51200,128,0.004886222382386525
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,51200,512,0.017147555947303772
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,51200,64,0.004159111115667555
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,51200,256,0.014002665877342224
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,51200,32,0.0041857775714662345
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,51200,768,0.01960355540116628
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,51200,6144,0.10513422224256729
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,51200,32,0.0147706667582194
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,51200,4096,0.07289066579606798
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,51200,7168,0.06948444578382704
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,16384,65536,0.36397955152723527
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,16384,16384,0.08039822181065877
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,16384,65536,0.20171822441948783
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,16384,51200,0.286007112926907
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,16384,12288,0.06186222367816501
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,16384,51200,0.1505137814415826
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,16384,10240,0.05177066723505656
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,16384,16384,0.058212445841895215
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,16384,8192,0.044403556320402354
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,16384,12288,0.04593422346644931
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,16384,7168,0.03763466742303636
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,16384,10240,0.040383110443751015
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,16384,6144,0.032615999380747475
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,16384,5120,0.02852977646721734
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,16384,8192,0.03592177894380357
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,16384,6144,0.030299554268519085
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,16384,4096,0.02442755632930332
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,16384,3584,0.021124444074100916
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,16384,7168,0.03287022312482198
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,16384,4096,0.023201778531074524
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,16384,3072,0.018589332699775696
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,51200,64,0.0151235560576121
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,16384,5120,0.027441778116756018
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,16384,3072,0.022656889425383672
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,16384,2048,0.013064888616402945
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,16384,1536,0.010958222051461538
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,16384,2560,0.021427555216683283
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,16384,1024,0.008621333373917473
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,16384,2048,0.019016888406541612
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,16384,768,0.007266666326257918
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,16384,1024,0.015569777952300178
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,16384,512,0.0052133335007561584
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,16384,768,0.014096889230940076
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,16384,256,0.003664888855483797
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,16384,512,0.013088000317414602
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,16384,128,0.0032764443506797156
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,16384,256,0.012057777908113269
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,16384,64,0.0031715554909573663
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,16384,128,0.01204711116022534
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,16384,32,0.0031537777847713898
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,16384,64,0.011782222323947482
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,51200,128,0.013889777991506787
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,16384,32,0.012375999655988483
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,16384,2560,0.015836444165971544
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,16384,3584,0.025506666964954797
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,12288,65536,0.2666204505496555
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,12288,16384,0.07423200209935506
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,12288,65536,0.17193955845303008
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,12288,51200,0.21006222565968832
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,12288,12288,0.05843200286229452
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,12288,51200,0.1321235497792562
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,12288,8192,0.038689778910742864
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,12288,16384,0.0517448882261912
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,12288,7168,0.03295644455485874
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,12288,8192,0.03365866674317254
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,12288,6144,0.028864890336990356
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,12288,5120,0.025083555115593806
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,12288,6144,0.02734222180313534
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,12288,4096,0.021566222111384075
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,12288,4096,0.021560889151361253
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,12288,3584,0.018558222386572096
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,12288,3584,0.02271911170747545
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,12288,3072,0.016153777639071148
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,12288,10240,0.04508799976772732
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,12288,3072,0.02129688858985901
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,12288,2560,0.01382844481203291
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,16384,1536,0.017528888252046373
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,12288,2048,0.012065778175989786
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,12288,1536,0.010144000252087912
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,12288,2560,0.01977777812216017
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,12288,10240,0.03696622120009528
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,12288,1024,0.00814133303032981
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,12288,7168,0.02966844373279148
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,12288,768,0.006786666810512543
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,12288,1536,0.016775111357371014
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,12288,512,0.005041777673694822
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,12288,256,0.0041599998043643106
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,12288,1024,0.014146667387750415
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,12288,768,0.013760888742076026
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,12288,512,0.012759110993809171
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,12288,5120,0.023504889673656885
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,12288,64,0.0031822222388452957
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,12288,256,0.012109333442317115
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,12288,32,0.0033653332955307434
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,12288,128,0.011692444483439127
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,12288,64,0.011721777419249216
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,12288,32,0.012055111428101858
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,10240,65536,0.23229598999023438
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,10240,65536,0.15956532955169678
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,10240,51200,0.18359911441802979
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,10240,16384,0.06036444505055746
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,10240,51200,0.12651111019982234
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,10240,12288,0.048439999421437584
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,10240,10240,0.0409804450141059
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,10240,12288,0.04022399915589227
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,10240,8192,0.029948443174362183
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,10240,10240,0.03564800156487359
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,12288,12288,0.04117777612474229
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,10240,7168,0.03066666589842902
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,10240,6144,0.026714666022194758
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,10240,5120,0.02295644415749444
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,10240,8192,0.03220977716975742
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,10240,7168,0.02882044514020284
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,12288,2048,0.018114666144053142
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,10240,6144,0.02588355541229248
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,10240,4096,0.019694222344292533
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,10240,3584,0.017165333032608032
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,10240,3072,0.015430221954981485
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,10240,5120,0.022967111733224656
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,12288,128,0.0035128887328836652
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,10240,4096,0.020921778347757127
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,10240,3584,0.021635555558734473
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,10240,2048,0.011707555916574268
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,10240,2560,0.018173333671357896
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,10240,1024,0.0079644446571668
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,10240,2048,0.017166222135225933
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,10240,1536,0.01579466627703773
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,10240,768,0.006234666539563074
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,10240,1024,0.01351377781894472
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,10240,512,0.00488711107108328
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,10240,768,0.013432000246312885
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,10240,256,0.003911111089918348
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,10240,512,0.012503999802801343
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,10240,128,0.00349866681628757
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,10240,16384,0.04988000128004286
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,10240,64,0.003169777699642711
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,10240,128,0.01107022249036365
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,10240,32,0.00349866681628757
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,10240,64,0.011428444749779172
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,10240,32,0.011434666812419891
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,8192,65536,0.1786471075481839
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,10240,2560,0.013222222526868185
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,10240,3072,0.01994400057527754
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,8192,65536,0.1127306620279948
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,8192,51200,0.14120177427927652
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,8192,16384,0.04800711075464884
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,8192,51200,0.08814489179187351
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,8192,16384,0.03788355655140347
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,8192,12288,0.03765155540572272
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,8192,8192,0.026346666945351496
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,8192,10240,0.030618667602539062
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,8192,7168,0.02260622216595544
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,8192,10240,0.027809778849283855
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,8192,8192,0.024234667420387268
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,10240,256,0.012087110843923358
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,8192,6144,0.02070577773782942
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,8192,5120,0.019048889478047688
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,8192,4096,0.014926221635606555
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,8192,3584,0.013106666505336761
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,8192,4096,0.017828444639841717
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,8192,3072,0.011735111474990845
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,10240,1536,0.009672000176376766
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,8192,3584,0.018541332748201158
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,8192,2560,0.010407999985747868
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,8192,2048,0.00869955536392
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,8192,3072,0.017616000440385606
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,8192,1536,0.007825777762466008
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,8192,2560,0.016581333345837064
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,8192,1024,0.005893333504597346
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,8192,2048,0.015787555111779105
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,8192,768,0.004549333204825719
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,8192,1024,0.012841777669058906
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,8192,512,0.003549333247873518
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,8192,768,0.01310488912794325
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,8192,256,0.0035751110149754416
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,8192,7168,0.022036444809701707
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,8192,512,0.012050666742854647
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,8192,128,0.0028897778441508612
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,8192,5120,0.017147555947303772
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,8192,64,0.0028488888508743713
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,8192,256,0.012101333174440594
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,8192,32,0.0028604444944196274
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,8192,128,0.011064888702498542
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,8192,64,0.011039999624093374
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,8192,32,0.012093333734406365
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,7168,65536,0.1598400010002984
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,7168,51200,0.125763561990526
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,7168,16384,0.044885334041383534
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,7168,65536,0.10418666733635797
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,7168,12288,0.035615109735065036
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,7168,51200,0.08199199703004625
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,7168,16384,0.03613600134849548
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,7168,12288,0.029134223858515423
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,7168,8192,0.024313777685165405
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,7168,10240,0.02628266645802392
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,7168,7168,0.02124799953566657
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,7168,6144,0.018815999229749043
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,7168,8192,0.023334221707450017
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,8192,12288,0.03126755687925551
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,8192,1536,0.014203555054134794
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,7168,7168,0.021299555897712708
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,7168,4096,0.014126222994592456
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,7168,6144,0.019902222686343722
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,7168,3584,0.012465777496496836
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,8192,6144,0.019991111424234178
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,7168,5120,0.018526222970750596
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,7168,3072,0.011334222224023608
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,7168,4096,0.017550221747822232
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,7168,2560,0.00980444418059455
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,7168,3584,0.018236445056067575
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,7168,1536,0.007302222152551015
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,7168,3072,0.016805332567956712
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,7168,1024,0.005607999861240387
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,7168,2048,0.014831999937693277
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,7168,768,0.004544888933499654
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,7168,1536,0.013800000150998434
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,7168,512,0.0038568890757030914
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,7168,1024,0.012797333300113678
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,7168,256,0.003167111012670729
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,7168,768,0.013059555656380124
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,7168,128,0.003152888889114062
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,7168,512,0.012161778079138862
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,7168,64,0.00281866660548581
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,7168,256,0.011355555719799466
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,7168,32,0.0031511110977994073
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,7168,128,0.011706666813956367
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,7168,64,0.011029333704047732
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,7168,10240,0.03057510985268487
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,7168,32,0.011701333026091257
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,6144,65536,0.13753067122565374
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,6144,51200,0.09759022129906549
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,7168,5120,0.016283555163277518
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,6144,65536,0.09729244311650594
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,6144,16384,0.037181334363089666
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,6144,12288,0.030452443493737116
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,6144,10240,0.026639110512203638
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,6144,51200,0.07491288582483928
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,6144,16384,0.03325422273741828
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,7168,2048,0.008642666869693333
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,6144,8192,0.022329777479171753
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,6144,12288,0.02734666731622484
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,6144,7168,0.020310221446885
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,7168,2560,0.016201777590645682
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,6144,6144,0.018409777018758986
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,6144,10240,0.02404444416364034
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,6144,8192,0.021513778302404616
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,6144,7168,0.020226667324701946
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,6144,3584,0.011732444167137146
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,6144,6144,0.019466666711701285
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,6144,5120,0.017857778403494094
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,6144,3072,0.010696888797812991
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,6144,4096,0.01681777834892273
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,6144,2560,0.009321778184837764
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,6144,2048,0.008344888687133789
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,6144,3584,0.01756000022093455
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,6144,3072,0.016380444169044495
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,6144,1536,0.006897777732875612
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,6144,2560,0.015096889601813423
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,6144,1024,0.004878222114510006
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,6144,768,0.004197333421972063
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,6144,2048,0.014139556222491793
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,6144,512,0.0035786665976047516
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,6144,1536,0.013737777868906656
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,6144,1024,0.012710221939616732
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,6144,256,0.0032088889016045462
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,6144,768,0.012753778033786349
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,6144,128,0.002983111060327954
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,6144,64,0.0028595555987623003
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,6144,512,0.01242844429281023
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,6144,256,0.011361777782440186
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,6144,128,0.01073333372672399
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,6144,64,0.01200799975130293
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,6144,32,0.01072266697883606
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,5120,65536,0.11629333761003281
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,5120,51200,0.08539733621809219
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,5120,65536,0.0881226658821106
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,5120,16384,0.03359377715322707
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,5120,51200,0.06919466786914401
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,5120,12288,0.027099554737408955
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,6144,5120,0.016182222300105624
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,6144,4096,0.012712000144852532
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,5120,16384,0.031120889716678198
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,5120,8192,0.01925511161486308
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,5120,7168,0.017500445246696472
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,5120,12288,0.024325332707828943
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,5120,6144,0.015568888849682279
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,5120,8192,0.02083200050724877
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,5120,5120,0.015511999527613321
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,5120,7168,0.01959022217326694
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,5120,4096,0.012337778177526263
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,5120,3584,0.01072622256146537
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,5120,5120,0.017322666115230985
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,5120,4096,0.016506666938463848
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,5120,3072,0.00997155573632982
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,5120,2560,0.008629333641793992
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,5120,3072,0.015455999308162265
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,5120,2048,0.00792622235086229
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,6144,32,0.002847111059559716
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,5120,2560,0.014563555518786112
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,5120,1536,0.005576888720194499
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,5120,1024,0.004567111117972268
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,5120,2048,0.013788444300492605
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,5120,1536,0.013408000270525614
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,5120,768,0.0041751112374994485
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,5120,512,0.0035297779573334586
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,5120,1024,0.012748444245921241
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,5120,256,0.003530666646030214
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,5120,768,0.012726222475369772
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,5120,512,0.0120000003112687
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,5120,256,0.012118221984969245
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,5120,10240,0.022514666120211285
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,5120,128,0.011400889191362592
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,5120,32,0.0031644445326593188
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,5120,10240,0.0222053329149882
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,5120,64,0.011029333704047732
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,4096,65536,0.08784000078837077
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,5120,6144,0.018365333477656048
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,5120,32,0.011370666325092316
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,4096,51200,0.07067644596099854
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,4096,16384,0.028984887732399836
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,4096,12288,0.022887999812761944
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,4096,65536,0.08296177784601848
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,4096,51200,0.06515822145673963
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,4096,10240,0.0199635558658176
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,4096,16384,0.028466665082507666
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,4096,8192,0.01720888912677765
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,4096,12288,0.023119111855824787
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,4096,7168,0.015826667348543804
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,4096,10240,0.02119111186928219
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,4096,6144,0.012531555361217923
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,4096,8192,0.019856888386938307
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,4096,5120,0.011017777853541903
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,4096,7168,0.018699554933442008
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,4096,4096,0.010488889283604093
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,4096,6144,0.017635555730925668
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,4096,3584,0.008952000074916417
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,4096,5120,0.016525333126386006
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,5120,128,0.002867555452717675
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,4096,4096,0.015492444237073263
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,4096,3072,0.008295111358165741
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,4096,2560,0.007484444313579136
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,4096,2048,0.006166222194830577
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,5120,64,0.0029004443850782183
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,4096,1536,0.00517511119445165
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,4096,3072,0.014069333672523499
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,4096,2560,0.014254222313563028
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,4096,1024,0.004221333397759331
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,4096,768,0.003967111309369405
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,4096,2048,0.013419555293189155
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,4096,512,0.003491555651028951
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,4096,1536,0.013159111142158508
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,4096,1024,0.012404444317022959
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,4096,256,0.0032275555034478507
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,4096,768,0.012740444805887012
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,4096,128,0.0028435554769304064
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,4096,64,0.0028862222615215513
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,4096,512,0.011797332929240333
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,4096,32,0.002805333377586471
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,5120,3584,0.017110221915774874
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,4096,128,0.011728000309732227
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,4096,64,0.011771555576059552
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,3584,65536,0.07551022370656331
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,4096,32,0.011019555230935415
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,3584,51200,0.06071644359164768
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,3584,16384,0.025719111164410908
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,3584,65536,0.07861510912577312
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,3584,12288,0.020745777421527438
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,3584,10240,0.017830222845077515
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,3584,51200,0.06326844294865926
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,3584,16384,0.02696000039577484
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,3584,8192,0.016062221593326993
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,3584,12288,0.022831110490692988
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,3584,7168,0.014765333798196582
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,3584,6144,0.013808888693650564
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,3584,10240,0.021104888783560857
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,3584,8192,0.01957155598534478
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,3584,5120,0.010635555618339114
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,3584,7168,0.018263111511866253
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,4096,3584,0.015467555986510383
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,3584,6144,0.017447110679414537
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,3584,3584,0.008632000121805403
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,3584,5120,0.01648622254530589
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,3584,3072,0.008044444852405125
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,3584,2560,0.007258666886223688
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,3584,4096,0.015153777268197803
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,3584,3584,0.015000889698664347
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,3584,2048,0.00591822216908137
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,3584,3072,0.01408622165520986
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,3584,1536,0.0047217777205838096
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,3584,1024,0.004202666795916027
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,3584,2048,0.012830221818553077
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,3584,1536,0.013079110946920184
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,3584,1024,0.012412444584899478
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,4096,256,0.011384000380833944
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,3584,512,0.0035413333939181436
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,3584,256,0.0033368888414568375
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,3584,768,0.012463111016485425
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,3584,128,0.0028168888141711554
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,3584,512,0.012065778175989786
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,3584,64,0.0028355556229750314
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,3584,256,0.011759999725553723
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,3584,32,0.0029048888633648553
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,3584,128,0.011708444191349877
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,3584,64,0.010835555692513784
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,3072,65536,0.0668026672469245
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,3584,32,0.011559111376603445
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,3072,51200,0.05356088942951626
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,3072,16384,0.02166844407717387
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,3072,65536,0.0768515533871121
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,3584,4096,0.009798222117953831
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,3072,51200,0.06148799922731188
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,3072,12288,0.018339556124475267
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,3072,10240,0.016072000066439312
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,3072,8192,0.013991110854678683
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,3072,16384,0.025985777378082275
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,3072,12288,0.02221511138810052
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,3072,7168,0.013295110729005603
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,3072,10240,0.02029333346419864
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,3072,6144,0.011694221860832639
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,3072,5120,0.011065777805116443
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,3584,2560,0.013404444687896304
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,3072,7168,0.01811911165714264
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,3072,4096,0.009308444129096137
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,3072,3584,0.008365333080291748
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,3072,6144,0.01723911033736335
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,3072,3072,0.00797333319981893
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,3072,5120,0.01591822173860338
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,3072,4096,0.014107555150985718
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,3072,2560,0.0070879997478591064
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,3072,2048,0.005940444353553984
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,3072,3072,0.013759999639458127
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,3072,1536,0.005151111218664381
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,3072,2560,0.013413333230548434
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,3072,1024,0.0041848888827694785
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,3072,1536,0.012777778009573618
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,3072,768,0.0038693332009845306
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,3072,1024,0.012057777908113269
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,3072,512,0.0034302222645945023
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,3072,768,0.012426666915416718
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,3072,256,0.003198222153716617
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,3072,512,0.012078222301271228
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,3072,128,0.002814222127199173
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,3072,256,0.011424889167149862
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,3072,64,0.0028115556471877625
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,3072,128,0.011035555766688453
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,3072,32,0.0028213332924577924
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,3072,8192,0.019263111882739596
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,3072,64,0.011359111302428775
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,3072,32,0.01033333357837465
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,2560,65536,0.057012445396847196
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,3584,768,0.0038533334930737815
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,2560,51200,0.04883111185497708
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,2560,16384,0.019866666860050626
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,2560,65536,0.07420266336864896
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,2560,12288,0.016532444291644625
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,2560,10240,0.0151591118839052
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,2560,16384,0.025024000141355727
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,2560,12288,0.021753778060277302
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,3072,2048,0.013020444247457715
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,2560,10240,0.01999200052685208
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,2560,7168,0.0123857781291008
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,2560,6144,0.01168444421556261
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,2560,8192,0.01885955532391866
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,2560,5120,0.010801778071456485
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,2560,7168,0.01754577789041731
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,2560,6144,0.01647111111217075
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,2560,4096,0.008992888861232335
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,2560,3584,0.008041777544551426
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,2560,5120,0.015389333168665567
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,2560,4096,0.014456889695591398
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,2560,3072,0.007605333295133378
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,2560,2560,0.006608888920810487
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,2560,3584,0.014156444205178155
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,2560,2048,0.0058355554938316345
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,2560,3072,0.013478221992651621
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,2560,1536,0.0046862223082118565
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,2560,2048,0.012734221915404001
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,2560,1024,0.0041964443193541635
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,2560,1536,0.01276266657643848
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,2560,768,0.0038524443904558816
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,2560,1024,0.012109333442317115
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,3072,3584,0.014166222678290473
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,2560,512,0.003506666670242945
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,2560,51200,0.05971466832690769
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,2560,256,0.003173333282272021
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,2560,768,0.012441777520709567
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,2560,128,0.0028293333533737394
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,2560,64,0.002834666727317704
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,2560,8192,0.013216888739003075
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,2560,512,0.011778666741318174
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,2560,32,0.002805333377586471
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,2560,256,0.011821333732869891
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,2560,128,0.011700444751315646
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,2048,65536,0.051238222254647144
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,2560,64,0.010728889041476779
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,2048,51200,0.03986666599909464
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,2560,32,0.01070577816830741
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,2048,16384,0.017321777012613084
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,2048,12288,0.015153777268197803
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,2048,65536,0.07133244143591987
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,2048,10240,0.01347555551264021
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,2048,51200,0.05772088633643257
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,2048,16384,0.024904888537194993
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,2048,8192,0.012701333396964602
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,2048,12288,0.021270222134060327
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,2048,7168,0.011533333195580376
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,2048,6144,0.011005333728260465
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,2048,10240,0.019890666007995605
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,2048,5120,0.009688888986905416
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,2048,8192,0.01780533293883006
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,2048,4096,0.009008000294367472
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,2048,6144,0.016024889217482675
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,2048,3584,0.007647111184067196
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,2048,3072,0.00628355559375551
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,2048,5120,0.015146666102939181
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,2048,4096,0.014120888378885059
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,2048,2560,0.005707555760939916
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,2560,2560,0.01351377781894472
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,2048,2048,0.005247999810510212
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,2048,3584,0.014274666706720987
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,2048,1536,0.0046311111913787
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,2048,3072,0.013441777891582914
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,2048,1024,0.004038222134113312
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,2048,768,0.0035582222044467926
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,2048,2560,0.013193777865833707
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,2048,2048,0.012844444149070315
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,2048,1536,0.01278222186697854
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,2048,1024,0.012411555482281579
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,2048,256,0.0031866667171319327
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,2048,768,0.012402666939629449
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,2048,128,0.002874666617976295
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,2048,512,0.0120666664507654
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,2048,64,0.002973333415057924
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,2048,256,0.012072888513406118
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,2048,128,0.0110871113008923
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,2048,64,0.011735999749766456
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,1536,65536,0.03902666767438253
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,1536,65536,0.06855911016464233
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,1536,51200,0.031139555904600356
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,2048,7168,0.016520000166363187
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,1536,16384,0.0155395550860299
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,1536,51200,0.05574311150444878
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,1536,12288,0.013405332962671915
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,1536,16384,0.02401155564520094
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,1536,10240,0.012437333663304647
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,2048,512,0.0034835553831524322
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,1536,12288,0.021107556091414556
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,1536,8192,0.01071466671095954
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,1536,10240,0.01924533314175076
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,1536,7168,0.010716444088353051
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,1536,6144,0.010728889041476779
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,1536,8192,0.01718755563100179
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,1536,5120,0.009671111073758867
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,1536,7168,0.01620444489849938
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,1536,4096,0.00815288888083564
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,2048,32,0.0028533333291610083
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,1536,3584,0.007311999797821045
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,1536,6144,0.01573600040541755
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,1536,3072,0.006751110984219446
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,1536,5120,0.014826666977670459
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,1536,2560,0.005881777654091517
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,1536,4096,0.014073777529928418
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,1536,3072,0.013463999662134381
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,1536,1536,0.004577777865860197
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,1536,2560,0.013415999710559845
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,1536,1024,0.003859555555714501
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,1536,2048,0.012736000120639801
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,1536,768,0.0038337777886125776
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,1536,1536,0.012800888882742988
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,1536,512,0.003504000190231535
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,1536,768,0.01219733307758967
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,1536,256,0.0031511110977994073
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,1536,512,0.011732444167137146
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,1536,128,0.0028577778074476454
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,1536,256,0.011360000405046674
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,1536,64,0.0028204443968004654
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,1536,128,0.011391999820868174
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,1536,32,0.0028204443968004654
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,1536,64,0.010741333166758219
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,1024,65536,0.03019733230272929
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,1024,65536,0.065482669406467
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,1536,2048,0.005208000126812193
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,1024,51200,0.024325332707828943
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,2048,32,0.010704889065689512
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,1536,3584,0.0144213338692983
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,1024,16384,0.012246222131782107
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,1024,12288,0.01035822182893753
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,1024,10240,0.010637332995732626
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,1024,51200,0.05242933498488533
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,1024,16384,0.022981334063741896
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,1024,8192,0.00942133367061615
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,1024,12288,0.01961688862906562
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,1024,7168,0.008639111287064022
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,1536,1024,0.012089778151777057
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,1024,10240,0.018225777480337355
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,1024,6144,0.008009778128729926
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,1024,8192,0.016572443975342643
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,1024,7168,0.015860444969601102
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,1024,4096,0.007651555869314406
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,1024,6144,0.015467555986510383
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,1024,5120,0.01459111107720269
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,1024,3072,0.006583111153708563
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,1024,4096,0.013793778088357715
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,1024,2560,0.0058764442801475525
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,1024,3584,0.014145778285132514
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,1024,2048,0.0052586665583981415
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,1024,3072,0.013402666482660504
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,1024,1536,0.004920888692140579
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,1024,2560,0.013109332985348172
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,1024,1024,0.0041911109454101985
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,1024,2048,0.01276711126168569
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,1536,32,0.011005333728260465
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,1024,768,0.0038604442444112566
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,1024,1536,0.012486221889654795
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,1024,512,0.0032071111102898917
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,1024,256,0.0028782222006056043
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,1024,1024,0.012048888537618848
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,1024,128,0.002862222285734283
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,1024,768,0.012095111111799875
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,1024,512,0.011757333245542316
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,1024,256,0.011711999773979187
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,1024,128,0.011015111373530494
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,1024,64,0.010701333483060202
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,768,65536,0.02518400053183238
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,1024,32,0.010718222293588849
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,768,51200,0.020818667279349435
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,1024,5120,0.008218666745556725
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,768,65536,0.06334488921695285
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,768,16384,0.010938666760921478
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,1024,3584,0.006963555183675554
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,768,12288,0.009885333478450775
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,768,51200,0.05107288890414768
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,768,10240,0.012054222325483957
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,768,8192,0.01038933296998342
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,768,7168,0.009642666412724389
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,768,12288,0.019222221440739103
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,768,10240,0.018219555417696636
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,768,6144,0.008982222113344405
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,768,8192,0.016528889536857605
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,768,5120,0.00810222244924969
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,768,4096,0.0075911109646161394
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,768,7168,0.01593155496650272
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,768,3584,0.0069191112286514705
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,768,6144,0.015488000379668342
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,768,3072,0.006326222171386083
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,768,4096,0.013761777844693927
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,768,2560,0.00589155571328269
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,768,3584,0.013759111364682516
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,768,2048,0.005201777650250329
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,768,3072,0.013615111509958902
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,1024,64,0.002520888836847411
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,768,1536,0.004582222137186262
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,768,1024,0.0038480001191298165
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,768,2560,0.013077333569526672
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,1024,32,0.002809777855873108
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,768,2048,0.012724444270133972
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,768,768,0.003563555578390757
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,768,512,0.003302222324742211
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,768,1536,0.012728888955381183
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,768,256,0.0028799999919202593
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,768,1024,0.012156444291273752
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,768,128,0.0028320000403457214
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,768,64,0.0028168888141711554
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,768,256,0.01142133358452055
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,768,32,0.002801777794957161
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,768,128,0.011423110961914062
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,768,64,0.01035733355416192
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,512,65536,0.018111111389266122
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,512,51200,0.015076445208655464
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,768,32,0.011009777585665384
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,512,16384,0.0107004443804423
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,768,16384,0.021951999929216173
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,512,65536,0.0613022247950236
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,512,12288,0.010666666759385003
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,512,51200,0.05131466521157158
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,512,10240,0.009655999640623728
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,512,8192,0.008303110798199972
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,512,16384,0.022315555148654517
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,512,7168,0.00794933322403166
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,512,10240,0.018231999542978074
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,512,8192,0.01641155613793267
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,768,5120,0.014454222387737699
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,512,5120,0.007965332931942409
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,512,7168,0.016136889656384785
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,512,4096,0.007304888632562425
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,512,6144,0.015118221441904703
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,512,3584,0.006615110983451207
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,512,4096,0.014096889230940076
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,512,3072,0.006216889040337668
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,512,3584,0.013752000199423896
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,512,2560,0.005629333357016246
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,512,3072,0.013419555293189155
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,768,768,0.012444444828563266
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,512,2048,0.004902222090297275
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,512,1536,0.00453955555955569
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,512,2560,0.013112000293201871
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,512,1024,0.0038417776425679526
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,512,2048,0.012851555314328937
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,512,768,0.0036071112586392295
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,512,1536,0.012772444221708508
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,512,512,0.0031866667171319327
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,512,1024,0.011718221836619906
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,512,256,0.0028391112056043413
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,512,768,0.012390221986505719
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,512,128,0.002883555574549569
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,512,512,0.011729777687125735
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,512,64,0.002534222271707323
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,512,12288,0.01904622217019399
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,512,32,0.002826666666401757
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,512,128,0.011587555209795633
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,512,6144,0.007621333003044128
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,512,64,0.011066666907734342
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,256,65536,0.015167999598715039
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,256,51200,0.013337777720557319
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,512,32,0.010008888940016428
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,256,16384,0.009986666341622671
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,256,12288,0.009697777529557547
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,256,51200,0.04891733328501383
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,512,5120,0.014491554763582019
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,256,10240,0.009015999734401703
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,256,16384,0.02160533269246419
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,256,8192,0.00831200016869439
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,256,12288,0.01924622224436866
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,256,7168,0.009326222042242685
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,256,6144,0.008455110920800103
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,256,8192,0.016200888488027785
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,768,512,0.01143022212717268
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,256,7168,0.016179554992251925
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,256,5120,0.007638221813572778
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,256,4096,0.007265778051482306
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,256,6144,0.015023110641373528
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,256,3584,0.006830222076839871
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,256,5120,0.014759999182489185
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,256,3072,0.006607999818192587
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,256,4096,0.013524444566832649
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,256,2560,0.006236444330877728
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,256,3584,0.013517333401574029
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,256,2048,0.004860444615284602
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,256,3072,0.013448889056841532
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,256,1536,0.004212444441186057
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,256,2560,0.013071111506885953
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,256,1024,0.0038933331767717996
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,512,256,0.011038222246699862
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,256,2048,0.012447111308574677
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,256,768,0.0035084444615576
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,256,512,0.003245333416594399
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,256,1536,0.012734221915404001
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,256,256,0.0028026666906144884
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,256,1024,0.011760888828171624
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,256,768,0.012057777908113269
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,256,512,0.011723555624485016
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,256,64,0.002814222127199173
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,256,65536,0.06091022491455078
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,256,128,0.010679110884666443
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,256,32,0.0028320000403457214
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,128,65536,0.01515111161602868
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,256,64,0.010683555569913654
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,256,10240,0.017921777235137094
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,128,51200,0.014135110709402295
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,256,32,0.010009778042634329
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,128,16384,0.009318222602208456
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,128,12288,0.008292444050312042
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,128,65536,0.05843466520309448
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,128,10240,0.008708444734414419
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,128,51200,0.04736444354057312
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,128,8192,0.00795999997191959
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,128,12288,0.018887110882335238
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,128,7168,0.007616000043021307
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,128,10240,0.018219555417696636
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,128,6144,0.007276444799370236
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,128,8192,0.016332444217469957
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,128,5120,0.006627555522653792
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,128,7168,0.015818667080667283
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,128,4096,0.006292444550328785
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,128,6144,0.015505777464972602
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,128,3584,0.006263999889294307
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,128,5120,0.01445777714252472
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,128,3072,0.005948444621430502
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,128,4096,0.013767999907334646
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,128,2560,0.006244444598754247
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,128,3584,0.014168888330459595
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,256,128,0.0028204443968004654
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,128,2048,0.005636444522274866
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,128,3072,0.013091555900043912
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,128,1536,0.004563555535342959
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,256,256,0.011364444262451597
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,128,2560,0.013064000341627332
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,128,768,0.0035146665241983202
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,128,2048,0.012438221938080259
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,128,512,0.003220444545149803
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,128,1536,0.012437333663304647
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,128,1024,0.012091555529170565
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,128,768,0.012061333490742577
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,128,128,0.002540444541308615
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,128,512,0.01142133358452055
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,128,64,0.0026151111556424033
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,128,256,0.011377777490350934
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,128,16384,0.021597334080272253
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,128,32,0.0028124445428450904
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,128,128,0.010671111444632212
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,64,65536,0.016192888220151264
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,128,64,0.01069866700304879
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,64,51200,0.013449778159459433
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,64,16384,0.008199111455016667
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,64,65536,0.056982219219207764
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,64,12288,0.00792711145348019
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,64,51200,0.0465866658422682
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,64,10240,0.006968888971540663
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,64,8192,0.0069422221018208405
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,64,16384,0.021372444099850122
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,64,7168,0.006559111177921295
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,64,12288,0.01891911029815674
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,64,10240,0.01753866672515869
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,64,6144,0.00628266649113761
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,64,8192,0.016519111063745286
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,64,5120,0.005912000106440649
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,64,4096,0.005607999861240387
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,64,7168,0.015783111254374187
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,64,6144,0.014840000205569796
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,64,3584,0.005879111174080107
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,64,3072,0.005932444499598608
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,64,5120,0.0148026661740409
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,128,1024,0.003863999827040566
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,64,2560,0.00629066675901413
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,64,4096,0.013809777796268463
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,64,2048,0.005712000032265981
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,64,3584,0.013897778259383308
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,64,1536,0.00452977791428566
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,64,3072,0.013421333498424955
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,64,1024,0.003843555433882607
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,64,2048,0.01278222186697854
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,64,768,0.003510222252872255
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,64,1024,0.011725333001878528
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,64,512,0.003157333367400699
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,64,768,0.01238844460911221
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,64,256,0.0028817777832349143
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,64,512,0.011685333318180509
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,64,128,0.0028533333291610083
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,128,32,0.0099982221921285
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,64,64,0.0025351111673646504
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,64,256,0.011358222199810876
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,64,32,0.0025351111673646504
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,64,128,0.010675555302037133
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,64,64,0.010002666877375709
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,32,65536,0.01584533353646596
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,32,51200,0.013449778159459433
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,32,65536,0.05711288584603203
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,32,51200,0.046520888805389404
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,32,16384,0.008299555215570662
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,32,12288,0.007275555696752336
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,32,16384,0.02141600019401974
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,32,10240,0.0069671107663048645
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,32,12288,0.01882222294807434
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,64,2560,0.013447999954223633
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,32,8192,0.006601777755551868
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,32,7168,0.006575111299753189
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,64,1536,0.012434666355450949
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,32,10240,0.017487110363112558
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,32,6144,0.0062871111763848206
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,32,8192,0.016897777716318767
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,32,5120,0.005879111174080107
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,32,7168,0.015513777732849121
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,32,4096,0.005591111050711737
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,32,3584,0.00590133335855272
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,32,5120,0.01482222146458096
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,32,3072,0.005933333188295364
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,32,3584,0.01424888935354021
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,32,2560,0.005607999861240387
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,32,3072,0.013439999686347114
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,32,2048,0.005933333188295364
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,32,2560,0.013062222136391534
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,64,32,0.011009777585665384
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,32,1536,0.004190222256713443
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,32,1024,0.003823111040724648
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,32,2048,0.012819555898507437
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,32,768,0.0035217776894569397
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,32,1536,0.012716444830099741
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,32,512,0.003162666741344664
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,32,1024,0.011745777395036487
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,32,256,0.00281866660548581
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,32,768,0.012427555190192329
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,32,128,0.0028568889117903183
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,32,512,0.011755555868148804
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,32,64,0.002512000087234709
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,32,256,0.011025778121418424
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,128,256,0.0028204443968004654
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,33,32,32,0.0024764444679021835
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,32,128,0.011680000358157687
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,32,64,0.011023999916182624
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,32,32,0.010334221853150262
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,32,6144,0.015108444624476962
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,33,32,4096,0.013750221994188098
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,65536,16384,0.3696320056915283
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,65536,16384,0.17423910564846465
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,65536,51200,0.509709358215332
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,65536,12288,0.2696239948272705
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,65536,51200,1.1210613250732422
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,65536,10240,0.22906488842434355
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,65536,8192,0.18445866637759736
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,65536,8192,0.09740889072418213
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,65536,12288,0.13235467010074192
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,65536,12288,0.21569155322180855
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,65536,7168,0.1644844479031033
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,65536,16384,0.27948000695970326
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,65536,10240,0.11323377821180557
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,65536,6144,0.13915822241041395
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,65536,7168,0.08349955744213527
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,65536,10240,0.1831644508573744
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,65536,6144,0.074090666241116
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,65536,5120,0.11918132834964329
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,65536,8192,0.15216267108917236
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,65536,5120,0.06378755304548475
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,65536,4096,0.09344800313313802
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,65536,4096,0.05452088846100701
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,65536,3584,0.08329866992102729
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,65536,7168,0.1370497809516059
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,65536,3584,0.05865866608089871
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,65536,3072,0.07179199986987643
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,65536,6144,0.12156532870398627
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,65536,4096,0.09387999773025513
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,65536,5120,0.10737955570220947
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,65536,3072,0.05130489004982842
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,65536,2560,0.059551113181644015
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,65536,3584,0.09136711226569282
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,65536,2048,0.047873778475655444
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,65536,2560,0.04491110973887973
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,65536,2048,0.036638223462634616
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,65536,1536,0.03772977656788296
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,65536,3072,0.08879822492599487
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,65536,2560,0.09205866522259182
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,65536,1024,0.027080888549486797
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,65536,1536,0.030181331766976252
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,65536,2048,0.06803466876347859
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,65536,768,0.020568889048364427
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,65536,1536,0.056249777475992836
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,65536,1024,0.023656888140572443
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,65536,512,0.01407911048995124
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,65536,768,0.020598222812016804
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,65536,768,0.04221066501405504
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,65536,512,0.03616711166169908
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,65536,512,0.018431110514534842
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,65536,128,0.006909333169460297
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,65536,256,0.01586933268441094
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,65536,256,0.03187822302182516
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,65536,64,0.005975111077229182
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,65536,32,0.006250666661394968
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,65536,128,0.026446221603287592
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,65536,64,0.015483554866578845
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,65536,128,0.01479822231663598
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,65536,32,0.016511110795868766
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,51200,65536,0.5401822196112739
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,65536,1024,0.04656711220741272
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,65536,256,0.008273777862389883
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,51200,51200,0.8539137840270996
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,51200,65536,1.0622142155965169
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,51200,16384,0.2805742157830132
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,51200,51200,0.4119697676764594
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,51200,16384,0.1420151127709283
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,51200,12288,0.2098862197664049
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,51200,12288,0.1081848873032464
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,65536,51200,0.8970426983303494
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,51200,10240,0.1745742162068685
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,51200,10240,0.09302755859163071
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,51200,8192,0.14241777526007757
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,51200,8192,0.08103111055162218
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,51200,7168,0.12529067198435465
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,51200,12288,0.18522844049665663
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,51200,10240,0.15955200460222033
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,51200,8192,0.13255822658538818
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,51200,7168,0.0695671108033922
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,51200,16384,0.23709334267510307
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,51200,6144,0.10422666867574056
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,51200,5120,0.08880444367726643
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,51200,6144,0.0620044469833374
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,51200,4096,0.07442666424645318
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,51200,5120,0.05401955710517036
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,51200,4096,0.045956446064843066
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,51200,7168,0.12005689409044053
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,51200,3584,0.06508444415198432
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,51200,6144,0.10701511303583781
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,51200,3584,0.045921779341167875
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,51200,5120,0.0951404439078437
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,51200,3072,0.05669244130452474
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,51200,4096,0.08252088891135322
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,51200,2560,0.04837333493762546
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,51200,3072,0.041137778096728854
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,51200,3584,0.0770124461915758
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,51200,3072,0.07068355878194173
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,51200,2560,0.03608622153600057
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,51200,2560,0.08006044228871663
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,51200,1536,0.02976800004641215
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,51200,2048,0.05968978007634481
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,51200,1024,0.02219111058447096
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,51200,1536,0.05060088965627882
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,51200,1024,0.020582222276263766
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,51200,768,0.01661333276165856
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,51200,1024,0.04316533274120755
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,51200,768,0.039064000050226845
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,51200,512,0.011391999820868174
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,51200,512,0.017017778423097398
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,51200,2048,0.038718223571777344
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,51200,256,0.0075937774446275495
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,51200,512,0.03420266509056091
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,51200,2048,0.0318488876024882
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,51200,256,0.014139556222491793
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,51200,128,0.004181333300140169
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,51200,256,0.029373334513770208
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,51200,1536,0.026505778233210247
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,51200,128,0.013824889229403602
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,51200,32,0.0038728887836138406
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,51200,128,0.0247706671555837
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,51200,51200,0.7223644256591797
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,51200,64,0.014431110686726041
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,51200,32,0.015232000086042615
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,51200,768,0.018788443671332467
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,16384,65536,0.3614959981706407
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,16384,51200,0.2618853251139323
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,16384,65536,0.200436446401808
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,51200,65536,0.9054684109157987
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,16384,16384,0.08031200038062201
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,16384,12288,0.062131557199690074
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,16384,51200,0.15052799383799234
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,16384,16384,0.05826666620042589
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,16384,10240,0.05167466733190748
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,16384,12288,0.046428445312711925
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,16384,10240,0.0410462220509847
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,16384,8192,0.04414577616585625
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,51200,64,0.003670222229427762
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,16384,16384,0.07272977961434259
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,16384,7168,0.037392000357309975
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,16384,10240,0.05459644397099813
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,16384,8192,0.037534223662482366
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,16384,6144,0.0326533317565918
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,16384,7168,0.03252266512976752
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,16384,8192,0.04871733321083916
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,16384,6144,0.030047112041049536
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,16384,7168,0.04554133282767402
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,16384,5120,0.028224001328150432
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,16384,4096,0.02308888898955451
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,16384,6144,0.04208533300293816
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,16384,5120,0.026867555247412786
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,16384,3584,0.02088088956144121
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,16384,5120,0.03983644313282437
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,16384,4096,0.023408000667889912
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,16384,4096,0.0369137790468004
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,16384,3072,0.01832799944612715
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,16384,51200,0.16646044784122044
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,16384,3584,0.024028443627887305
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,16384,3584,0.035530666510264076
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,16384,2560,0.015775110986497667
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,16384,65536,0.21177332931094697
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,16384,2048,0.013103110922707452
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,16384,3072,0.021741333934995864
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,16384,3072,0.035036444664001465
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,16384,1536,0.010642666783597736
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,16384,2560,0.020869332883093093
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,16384,2560,0.0322035551071167
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,16384,1024,0.008391111261314815
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,16384,2048,0.03112444281578064
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,16384,1536,0.028668443361918133
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,16384,1024,0.026733333865801494
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,16384,1024,0.015005333556069268
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,16384,512,0.005581333405441708
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,16384,12288,0.06260799699359469
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,16384,768,0.025036444266637165
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,16384,256,0.0037662221325768363
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,16384,768,0.014141332772043018
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,16384,512,0.02197155521975623
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,16384,512,0.01277955538696713
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,16384,128,0.003181333343187968
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,16384,256,0.01994755533006456
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,16384,256,0.012424888710180918
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,16384,64,0.0029004443850782183
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,16384,128,0.018955555227067735
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,16384,128,0.011383111278216044
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,16384,64,0.012416889270146688
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,16384,32,0.01239111108912362
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,12288,65536,0.2589804331461589
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,12288,65536,0.16947733031378853
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,12288,51200,0.2027155558268229
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,12288,51200,0.1314800050523546
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,16384,768,0.007096889118353526
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,16384,2048,0.01852799952030182
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,16384,1536,0.017328888177871704
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,12288,16384,0.073161780834198
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,12288,12288,0.05776266919242012
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,12288,16384,0.051517334249284535
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,12288,10240,0.04736622174580892
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,12288,12288,0.04144355654716492
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,12288,16384,0.06405778063668145
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,16384,32,0.0028684443483750024
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,12288,10240,0.0369120008415646
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,12288,12288,0.053898665640089244
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,12288,8192,0.03844533363978068
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,12288,7168,0.03291733397377862
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,12288,8192,0.03324888812171088
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,12288,10240,0.04909155435032315
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,12288,7168,0.029615110821194116
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,12288,6144,0.028852442900339764
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,12288,5120,0.024937777055634394
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,12288,7168,0.0414648883872562
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,12288,6144,0.026936888694763184
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,12288,65536,0.17938489384121367
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,12288,6144,0.03959555427233378
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,12288,5120,0.023398222194777593
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,12288,3584,0.01850222216712104
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,12288,5120,0.03701600101259019
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,12288,51200,0.14169243971506754
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,12288,4096,0.033209777540630765
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,12288,4096,0.02163999941613939
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,12288,3072,0.016674665941132438
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,12288,3584,0.02215733296341366
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,12288,3584,0.03258488906754388
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,12288,2560,0.013843555417325763
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,12288,3072,0.03288177649180094
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,12288,3072,0.020584889584117465
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,12288,2048,0.011763555308183035
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,12288,1536,0.009645333720578088
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,12288,2560,0.019142222073343065
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,12288,2560,0.03011911114056905
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,12288,2048,0.029097778929604426
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,12288,1024,0.008210666477680206
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,12288,1536,0.027890665663613215
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,12288,768,0.006606222026877933
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,12288,2048,0.01761511133776771
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,12288,1024,0.013738666971524557
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,12288,1024,0.023938667443063524
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,12288,512,0.004655111167165968
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,12288,768,0.022862222459581163
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,12288,768,0.01344622257683012
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,12288,256,0.0038417776425679526
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,12288,512,0.012376888758606382
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,12288,512,0.02165866725974613
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,12288,8192,0.04519822200139364
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,12288,256,0.011733333269755045
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,12288,256,0.01994222237004174
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,12288,64,0.003208000005947219
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,12288,4096,0.02188355558448368
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,12288,128,0.01788444485929277
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,12288,128,0.011753777662913004
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,12288,32,0.0032115555885765287
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,12288,64,0.011628444823953839
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,12288,32,0.011472889118724398
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,10240,65536,0.22950755225287545
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,10240,65536,0.16143200132581922
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,10240,51200,0.18058310614691842
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,10240,16384,0.06229066848754883
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,12288,1536,0.01603555513752831
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,10240,51200,0.12640533182356092
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,10240,16384,0.04934222168392605
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,10240,12288,0.04782933327886793
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,10240,12288,0.03961777687072754
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,10240,16384,0.06025155385335287
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,10240,10240,0.04102844330999587
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,10240,12288,0.051960001389185585
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,10240,8192,0.035340444909201726
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,10240,10240,0.03592177894380357
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,10240,10240,0.047367999951044716
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,10240,51200,0.13403556081983778
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,10240,65536,0.16380711396535239
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,10240,7168,0.026297777891159058
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,10240,8192,0.04270311196645101
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,10240,8192,0.031382222970326744
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,10240,7168,0.028813332319259644
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,10240,7168,0.04048177931043837
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,10240,6144,0.025377778543366328
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,10240,5120,0.021235555410385132
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,10240,6144,0.03934489025010003
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,10240,4096,0.01796711153454251
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,10240,5120,0.022966222630606756
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,10240,5120,0.035595556100209556
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,10240,4096,0.021199110481474135
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,10240,4096,0.03429422113630507
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,10240,3072,0.013640888863139682
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,10240,3584,0.020900444851981267
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,10240,3584,0.0321395562754737
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,10240,2560,0.01202400028705597
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,10240,3072,0.019857777489556205
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,10240,3072,0.03215822246339586
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,10240,2048,0.01069777790043089
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,10240,2560,0.03048711021741231
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,12288,128,0.0032186667538351486
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,10240,1536,0.009011555876996782
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,10240,2048,0.01722311145729489
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,10240,2048,0.03039111031426324
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,10240,1024,0.007661333514584436
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,10240,1536,0.027391110857327778
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,10240,1536,0.01551999979548984
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,10240,1024,0.013796444568369122
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,10240,1024,0.024392000503010217
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,10240,512,0.0047733332547876565
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,10240,768,0.022659555077552795
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,10240,768,0.012784000072214337
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,10240,6144,0.023285332653257582
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,10240,256,0.003867555409669876
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,10240,512,0.012381333443853589
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,10240,128,0.0034942221310403612
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,10240,256,0.021035555336210463
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,10240,256,0.011751111182901593
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,10240,64,0.002846222163902389
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,10240,128,0.011711999773979187
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,10240,128,0.018953777021831937
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,10240,32,0.00313688897424274
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,10240,64,0.011405333048767514
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,10240,3584,0.015861334072219003
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,10240,32,0.011767999993430244
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,8192,65536,0.17538666725158691
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,8192,65536,0.11228888564639622
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,8192,51200,0.12714132997724745
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,10240,2560,0.0181351105372111
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,8192,16384,0.046781334612104625
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,8192,51200,0.08755111032062107
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,8192,12288,0.03660533494419522
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,8192,16384,0.03743911120626662
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,10240,768,0.005896889087226655
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,8192,10240,0.027913779020309448
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,8192,16384,0.059248891141679555
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,8192,12288,0.031097776359981958
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,8192,8192,0.023745778534147475
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,8192,12288,0.051113777690463595
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,8192,10240,0.027855998939938013
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,10240,512,0.02197333342499203
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,8192,7168,0.020996444755130347
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,8192,10240,0.04703022374047173
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,8192,8192,0.023958222733603582
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,8192,6144,0.018339556124475267
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,8192,8192,0.04184622234768338
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,8192,65536,0.16051910983191595
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,8192,51200,0.13134845097859701
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,8192,7168,0.02295555505487654
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,8192,5120,0.01605955594115787
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,8192,4096,0.014195554786258273
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,8192,6144,0.020770667327774894
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,8192,6144,0.03712177938885159
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,8192,5120,0.03634044528007507
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,8192,5120,0.019311999281247456
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,8192,3584,0.012054222325483957
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,8192,3072,0.011136888629860349
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,8192,4096,0.03393777873780992
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,8192,4096,0.017861333158281114
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,8192,3584,0.031707555055618286
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,8192,3584,0.018561777141359117
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,8192,2560,0.009689778089523315
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,8192,2048,0.008604444563388824
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,8192,3072,0.016938666502634685
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,8192,3072,0.03218844532966614
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,8192,2560,0.03051999873585171
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,8192,2560,0.016348444753222995
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,8192,1536,0.007276444799370236
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,8192,1024,0.005979555762476391
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,8192,2048,0.015403555499182807
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,8192,2048,0.029363556040657893
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,8192,768,0.004519111166397731
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,8192,1536,0.014461333552996317
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,8192,1024,0.023016000787417095
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,8192,1024,0.013067555924256643
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,8192,512,0.0038559999730851916
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,8192,768,0.012402666939629449
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,8192,768,0.022643556197484333
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,8192,256,0.003206222214632564
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,8192,512,0.012289777398109436
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,8192,512,0.020561777883105807
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,8192,256,0.01955111159218682
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,8192,128,0.0028444443725877335
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,8192,256,0.012087110843923358
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,8192,64,0.0028168888141711554
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,8192,32,0.0028728888266616394
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,8192,128,0.011352889239788055
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,8192,128,0.017913776967260573
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,8192,64,0.011906666888131036
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,8192,7168,0.0403164459599389
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,8192,32,0.011733333269755045
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,7168,65536,0.15423822402954102
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,7168,51200,0.12207644515567356
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,7168,65536,0.10489688979254828
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,7168,16384,0.043748444981045194
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,7168,51200,0.08097066481908162
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,7168,16384,0.035423109928766884
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,7168,12288,0.03487199876043532
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,7168,12288,0.02923111120859782
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,8192,1536,0.025456888808144465
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,7168,16384,0.05859377649095324
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,7168,12288,0.051071110698911876
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,7168,8192,0.021903110875023737
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,7168,10240,0.026191110412279766
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,7168,10240,0.046406222714318164
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,7168,51200,0.13053511248694524
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,7168,65536,0.1604479948679606
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,7168,8192,0.02366311185889774
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,7168,7168,0.019183110859658983
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,7168,6144,0.016872889465755887
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,7168,8192,0.04177688890033298
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,7168,5120,0.014420444766680399
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,7168,7168,0.02127555509408315
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,7168,7168,0.039460443788104586
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,7168,6144,0.020008888509538438
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,7168,4096,0.012995555169052549
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,7168,6144,0.037568890386157565
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,7168,3584,0.011429333024554782
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,7168,5120,0.018573333819707234
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,7168,5120,0.035777777433395386
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,7168,3072,0.010129777921570672
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,7168,4096,0.03221777743763394
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,7168,4096,0.01754133403301239
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,7168,3584,0.017836444907718234
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,7168,2560,0.008665777742862701
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,7168,3584,0.031721777386135526
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,7168,2048,0.008255999949243333
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,7168,3072,0.030790223015679255
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,7168,3072,0.017062221964200337
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,7168,2560,0.029979556798934937
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,7168,2560,0.016144000821643405
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,7168,2048,0.014196443888876172
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,7168,2048,0.02735200027624766
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,7168,1536,0.013526221944226159
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,7168,768,0.00423911131090588
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,7168,1024,0.023141332798533972
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,7168,1024,0.012576888832781049
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,7168,512,0.0038844446341196695
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,7168,768,0.022321777211295232
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,7168,10240,0.02982399861017863
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,7168,768,0.012457778056462606
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,7168,256,0.00350222239891688
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,7168,512,0.012039999994966718
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,7168,512,0.02093244426780277
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,7168,128,0.002826666666401757
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,7168,256,0.011716444459226398
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,7168,256,0.01956622302532196
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,7168,64,0.0028684443483750024
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,7168,128,0.011348444554540845
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,7168,128,0.018886221779717337
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,7168,32,0.0028195555011431375
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,7168,64,0.011027555498811932
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,7168,32,0.011706666813956367
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,6144,65536,0.12506843937767878
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,6144,65536,0.0973022249009874
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,6144,51200,0.09916444619496663
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,7168,1536,0.006945778098371293
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,6144,51200,0.07461244530147977
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,7168,1024,0.005233777893914117
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,6144,16384,0.03762755460209317
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,6144,12288,0.030291554000642564
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,6144,16384,0.03327022327317132
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,6144,12288,0.027036445008383855
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,6144,16384,0.05876444445716011
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,6144,10240,0.02611733310752445
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,6144,12288,0.05027911067008972
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,6144,65536,0.15978933705223933
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,6144,10240,0.024192000428835552
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,6144,8192,0.02225688927703434
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,6144,10240,0.04583466715282864
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,6144,7168,0.019893333315849304
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,6144,8192,0.022299556268586054
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,6144,8192,0.04209511147605049
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,6144,7168,0.020279111133681405
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,6144,7168,0.0384808878103892
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,6144,6144,0.017500445246696472
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,6144,5120,0.0158933334880405
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,6144,6144,0.01940711173746321
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,6144,6144,0.03643200132581923
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,6144,5120,0.018079110317760043
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,6144,5120,0.03491200009981791
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,6144,3584,0.009993777506881291
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,6144,4096,0.01685244507259793
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,6144,4096,0.03326844506793552
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,6144,3072,0.009710222482681274
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,6144,3584,0.017270222306251526
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,6144,3584,0.03142666816711426
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,6144,2560,0.008279999925030602
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,6144,3072,0.016180444094869826
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,6144,3072,0.030590222941504583
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,6144,2048,0.0075911109646161394
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,6144,2560,0.015449777245521545
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,6144,2560,0.02999911043379042
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,6144,1536,0.006596444381607904
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,6144,2048,0.013763555222087435
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,6144,2048,0.02678933408525255
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,6144,1024,0.004922666483455234
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,6144,1536,0.013428444663683573
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,6144,1536,0.025751999682850305
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,6144,51200,0.13036978244781494
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,6144,768,0.0041955556306574075
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,6144,1024,0.012390221986505719
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,6144,1024,0.023099554909600153
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,6144,512,0.0038533334930737815
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,6144,768,0.02160888910293579
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,6144,768,0.012080888781282636
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,6144,512,0.020624889267815482
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,6144,512,0.012102222277058495
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,6144,128,0.0028231110837724474
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,6144,256,0.011383111278216044
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,6144,256,0.01939288940694597
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,6144,64,0.0028035555862718155
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,6144,128,0.011724444727102915
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,6144,128,0.01792355544037289
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,6144,32,0.00282577777074443
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,6144,64,0.011004444625642566
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,6144,32,0.011015111373530494
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,5120,65536,0.11036444372600979
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,7168,1536,0.025068443682458665
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,5120,51200,0.08780711226993138
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,5120,65536,0.08700355556276108
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,5120,16384,0.033004442850748696
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,5120,51200,0.06867555777231853
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,5120,16384,0.031063109636306763
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,5120,12288,0.02661688956949446
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,5120,16384,0.058238221539391406
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,6144,256,0.0031991110493739447
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,5120,12288,0.02465244465404087
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,5120,65536,0.15905955102708605
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,5120,12288,0.04954222175810072
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,5120,10240,0.023456000619464453
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,5120,51200,0.13038578298356798
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,5120,8192,0.020652444826232064
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,6144,4096,0.01181333346499337
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,5120,10240,0.022096888886557683
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,5120,10240,0.04560533497068617
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,5120,8192,0.02091111077202691
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,5120,8192,0.04167200128237406
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,5120,6144,0.016194666425387066
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,5120,5120,0.014128888646761576
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,5120,7168,0.01978755493958791
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,5120,7168,0.03831377625465393
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,5120,6144,0.01865511139233907
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,5120,6144,0.03647644321123759
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,5120,5120,0.01763288842307197
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,5120,5120,0.03563022282388475
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,5120,3584,0.009686222506894005
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,5120,4096,0.0332622230052948
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,5120,3584,0.01657511128319634
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,5120,3072,0.00904088881280687
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,5120,3584,0.031726221243540444
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,5120,3072,0.03161066770553589
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,5120,3072,0.01552177800072564
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,5120,2560,0.007941332956155142
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,5120,2560,0.014473777678277759
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,5120,2048,0.006883555402358373
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,5120,7168,0.017779555585649278
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,5120,2048,0.013834666874673633
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,5120,1536,0.006224888894293044
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,5120,2048,0.026085333691702947
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,5120,1536,0.013281777501106262
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,5120,4096,0.010325333310498131
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,5120,1536,0.02437777817249298
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,5120,1024,0.0047377778424157035
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,5120,768,0.0042151109211974675
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,5120,4096,0.01647733317481147
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,5120,1024,0.022970666488011677
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,5120,512,0.003900444342030419
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,5120,768,0.012381333443853589
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,5120,768,0.023418666587935552
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,5120,256,0.0035146665241983202
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,5120,512,0.021055999729368422
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,5120,512,0.011727111207114326
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,5120,128,0.0031600000543726813
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,5120,256,0.021270222134060327
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,5120,256,0.011680000358157687
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,5120,64,0.002809777855873108
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,5120,128,0.018537777993414137
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,5120,128,0.0110880004035102
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,5120,32,0.0028684443483750024
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,5120,64,0.011418666276666852
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,4096,65536,0.08823733197318183
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,5120,32,0.0107342220014996
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,5120,2560,0.029457777738571167
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,4096,51200,0.07065955797831218
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,4096,16384,0.026884444885783728
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,4096,51200,0.06409244404898749
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,4096,12288,0.02127200033929613
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,4096,16384,0.028460443019866943
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,4096,16384,0.05800977680418226
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,4096,12288,0.022795556320084467
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,4096,10240,0.018535999788178336
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,4096,12288,0.04924799998601278
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,4096,65536,0.15848622057172987
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,4096,8192,0.016525333126386006
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,5120,1024,0.01239111108912362
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,4096,10240,0.02128177715672387
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,4096,10240,0.04519022173351712
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,4096,7168,0.014576888746685453
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,4096,8192,0.04046577877468533
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,4096,6144,0.013445333474212222
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,4096,7168,0.03887822230656942
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,4096,7168,0.018304889400800068
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,4096,5120,0.012657778130637275
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,4096,6144,0.018033777674039204
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,4096,4096,0.011010666688283285
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,4096,5120,0.016535111599498324
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,4096,5120,0.03439199924468994
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,4096,3584,0.010220444036854638
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,4096,4096,0.015437333120240105
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,4096,4096,0.031383110417260066
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,4096,65536,0.08093866374757555
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,4096,3072,0.009047110875447592
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,4096,3584,0.015456888410780164
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,4096,3584,0.03122133347723219
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,4096,2560,0.008292444050312042
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,4096,3072,0.01441333360142178
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,4096,2048,0.006414222220579783
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,4096,2560,0.013749333719412485
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,4096,2048,0.025978666212823655
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,4096,51200,0.1305262247721354
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,4096,1536,0.013080000049538083
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,4096,8192,0.019890666007995605
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,4096,1024,0.00388711111413108
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,4096,1536,0.02510044475396474
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,4096,6144,0.03608977794647217
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,4096,1024,0.012416000167528788
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,4096,768,0.003826666623353958
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,4096,1024,0.022981334063741896
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,4096,512,0.0032071111102898917
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,4096,768,0.02158755560715993
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,4096,768,0.012050666742854647
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,4096,256,0.0031644445326593188
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,4096,512,0.012060444388124677
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,4096,512,0.020628444022602506
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,4096,128,0.002854222224818336
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,4096,256,0.011462222370836469
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,4096,256,0.020925333102544148
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,4096,3072,0.028920888900756836
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,4096,128,0.011000889043013254
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,4096,2560,0.027401778433057997
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,4096,32,0.002862222285734283
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,4096,64,0.0107022225856781
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,3584,65536,0.07609155442979601
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,4096,2048,0.013450666434235044
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,4096,32,0.010692444112565784
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,4096,1536,0.004920888692140579
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,3584,51200,0.061512887477874756
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,3584,65536,0.0785342190000746
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,3584,16384,0.02453600035773383
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,3584,51200,0.06295110781987508
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,3584,16384,0.026384888423813715
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,3584,16384,0.05738311343722873
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,3584,12288,0.01965777741538154
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,3584,65536,0.15946577654944524
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,3584,51200,0.13049422370062932
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,3584,10240,0.01735466718673706
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,3584,12288,0.022272000710169475
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,3584,12288,0.04920444554752774
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,3584,8192,0.01521511044767168
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,3584,10240,0.0207368897067176
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,3584,10240,0.04508622156249153
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,3584,7168,0.013635555903116861
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,3584,8192,0.01941688855489095
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,3584,8192,0.04040088918473985
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,3584,6144,0.012958221965365939
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,4096,64,0.002536000063021978
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,3584,7168,0.018716444571812946
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,3584,7168,0.03906666570239597
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,3584,5120,0.012257777982287936
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,4096,128,0.019254222512245178
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,3584,4096,0.01038933296998342
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,3584,6144,0.037017779217825994
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,3584,5120,0.03387466735310025
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,3584,3584,0.009321778184837764
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,3584,5120,0.01667288939158122
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,3584,3072,0.008634666601816813
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,3584,4096,0.03302399979697333
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,3584,4096,0.01531555586391025
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,3584,3584,0.030645334058337744
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,3584,2560,0.00797155582242542
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,3584,3072,0.029116445117526587
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,3584,3072,0.014449778530332776
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,3584,2048,0.006169777777459886
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,3584,2560,0.028038223584493
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,3584,1536,0.004861333303981357
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,3584,2048,0.013428444663683573
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,3584,2048,0.02677333354949951
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,3584,1024,0.0038906666967603895
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,3584,1536,0.01277511070171992
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,3584,1536,0.025395555628670588
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,3584,768,0.0035342222286595237
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,3584,1024,0.01239111108912362
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,3584,1024,0.02345866627163357
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,3584,512,0.003212444484233856
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,3584,768,0.012415111064910889
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,3584,512,0.011778666741318174
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,3584,512,0.02162844439347585
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,3584,256,0.0031591111587153543
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,3584,6144,0.01722311145729489
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,3584,256,0.02057422200838725
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,3584,256,0.011750222080283694
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,3584,128,0.0028008888992998335
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,3584,64,0.002536000063021978
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,3584,32,0.002536888958679305
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,3584,128,0.019556444552209642
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,3584,128,0.011443555355072021
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,3584,64,0.010738666686746808
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,3584,3584,0.014719110396173267
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,3072,65536,0.06716889142990112
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,3584,32,0.01073333372672399
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,3072,51200,0.05156266689300537
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,3584,2560,0.013351110948456658
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,3072,65536,0.07629688580830891
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,3072,51200,0.06113511323928833
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,3072,12288,0.017549332645204332
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,3072,16384,0.026165333059098985
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,3072,16384,0.05729866690105862
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,3072,10240,0.015547555353906421
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,3072,12288,0.02215555475817786
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,3072,65536,0.1588266690572103
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,3072,51200,0.12968711058298746
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,3072,12288,0.04883644315931532
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,3072,8192,0.013746666411558786
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,3072,7168,0.01273155543539259
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,3584,768,0.022302221920755174
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,3072,10240,0.02052533295419481
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,3072,10240,0.04522933231459724
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,3072,8192,0.01902844508488973
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,3072,6144,0.01167377746767468
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,3072,5120,0.0107342220014996
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,3072,7168,0.017934223016103108
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,3072,7168,0.038520889149771795
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,3072,4096,0.00980000032318963
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,3072,6144,0.03667555583847894
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,3072,5120,0.016117332710160148
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,3072,5120,0.03423110975159539
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,3072,3584,0.008624888956546783
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,3072,4096,0.031735112269719444
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,3072,4096,0.01516355574131012
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,3072,3072,0.007658667034573025
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,3072,3584,0.014163555370436775
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,3072,3584,0.03150577677620782
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,3072,2560,0.006956444846259222
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,3072,3072,0.013763555222087435
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,3072,3072,0.027535999814669292
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,3072,2048,0.005597333527273602
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,3072,2560,0.013631111217869652
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,3072,2560,0.027455111344655354
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,3072,16384,0.021387555532985266
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,3072,1536,0.004553777890072929
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,3072,2048,0.01274577776590983
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,3072,2048,0.02608088817861345
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,3072,1024,0.0038453332251972626
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,3072,1536,0.02513866623242696
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,3072,1536,0.012448000411192576
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,3072,768,0.003539555602603488
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,3072,1024,0.012215110990736218
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,3072,1024,0.022966222630606756
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,3072,512,0.0032008888406885993
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,3072,768,0.022287999590237934
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,3072,768,0.011717333561844297
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,3072,256,0.003175111073586676
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,3072,512,0.011869333684444427
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,3072,512,0.021594666772418555
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,3072,128,0.002809777855873108
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,3072,8192,0.039545777771208025
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,3072,256,0.020768000019921195
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,3072,64,0.0025457777082920074
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,3072,128,0.018253333038753934
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,3072,32,0.002529777793420686
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,3072,6144,0.01748533381356133
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,2560,65536,0.05923822191026476
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,3072,32,0.0107342220014996
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,2560,51200,0.046556442975997925
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,2560,51200,0.059246222178141274
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,2560,65536,0.15849955876668295
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,2560,16384,0.019633778267436557
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,2560,16384,0.025027554896142747
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,2560,51200,0.12957689497205946
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,2560,12288,0.01601777805222405
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,2560,16384,0.05654222435421414
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,2560,12288,0.02161066730817159
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,2560,10240,0.014095111025704278
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,2560,12288,0.04897333184878031
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,3072,128,0.011391999820868174
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,2560,8192,0.012483555409643384
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,3072,64,0.011417778001891242
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,2560,10240,0.020059555768966675
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,2560,7168,0.011691555380821228
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,2560,8192,0.01909955508179135
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,2560,65536,0.07345955239401923
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,2560,8192,0.040720889965693154
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,2560,6144,0.010857777463065254
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,2560,7168,0.017720000611411203
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,2560,7168,0.039108445247014366
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,2560,5120,0.010262221925788457
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,2560,6144,0.01647733317481147
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,2560,6144,0.036657777097490095
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,2560,4096,0.008960000342792934
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,2560,5120,0.03337688909636603
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,2560,3584,0.00793866647614373
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,2560,4096,0.031114667654037476
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,2560,4096,0.014902222487661572
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,2560,3072,0.006981333096822103
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,2560,3584,0.013812444276279874
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,2560,3072,0.01389955480893453
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,2560,2560,0.006258666515350342
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,2560,3072,0.02773511078622606
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,3072,256,0.011389333340856763
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,2560,2560,0.013431111143694984
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,2560,2048,0.005241777747869492
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,2560,2048,0.01310400002532535
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,2560,2048,0.02576711111598545
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,2560,10240,0.0444124440352122
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,2560,1536,0.02400355537732442
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,2560,1536,0.012444444828563266
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,2560,1024,0.0038657776183552216
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,2560,1024,0.02281155520015293
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,2560,768,0.0038497779104444715
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,2560,5120,0.016113777955373127
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,2560,768,0.011767110890812345
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,2560,768,0.02273599969016181
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,2560,512,0.0032177778581778207
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,2560,3584,0.029397332006030615
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,2560,256,0.003212444484233856
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,2560,512,0.020922667450375024
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,2560,512,0.011737777955002256
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,2560,128,0.0028320000403457214
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,2560,256,0.011764444410800934
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,2560,256,0.01955911186006334
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,2560,64,0.002838222309947014
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,2560,128,0.017862222260899015
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,2560,128,0.011371555427710215
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,2560,2560,0.02741333345572154
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,2048,65536,0.04826755656136406
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,2560,64,0.010695999695195092
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,2560,32,0.010391111175219217
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,2048,51200,0.03765955567359924
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,2048,65536,0.0707262224621243
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,2560,1536,0.00452977791428566
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,2048,16384,0.015875554747051664
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,2048,51200,0.05670577949947781
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,2048,12288,0.013384888569513956
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,2048,16384,0.025213332639800176
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,2048,16384,0.05653599898020426
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,2048,51200,0.1298826667997572
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,2048,10240,0.011699555648697747
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,2560,1024,0.012111110819710625
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,2048,12288,0.02163377735349867
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,2048,12288,0.04837422238455879
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,2048,8192,0.013073777986897362
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,2048,10240,0.01973511113060845
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,2048,10240,0.044646223386128746
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,2048,7168,0.012712000144852532
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,2048,8192,0.018537777993414137
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,2048,8192,0.04073511229621039
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,2048,6144,0.011693333586057028
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,2048,7168,0.017180444465743173
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,2048,7168,0.038146668010287814
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,2048,5120,0.010663111176755695
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,2048,6144,0.01650399963061015
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,2048,6144,0.035664889547559954
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,2048,4096,0.009694221946928237
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,2048,5120,0.01517777807182736
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,2048,5120,0.03179377648565505
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,2560,32,0.0028204443968004654
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,2048,3584,0.009013333254390294
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,2048,4096,0.013980444934633044
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,2048,3072,0.00655733338660664
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,2048,4096,0.030821333328882854
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,2048,2560,0.005964444329341252
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,2048,3584,0.029409776131312054
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,2048,3584,0.01388177772363027
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,2048,3072,0.02741777731312646
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,2048,2048,0.005260444349712796
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,2048,2560,0.013453333742088742
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,2048,2560,0.027314666244718764
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,2048,1536,0.0047484445903036325
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,2048,2048,0.025812443759706285
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,2048,2048,0.01274222218328052
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,2048,1024,0.0038524443904558816
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,2048,1536,0.025411556164423626
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,2048,1536,0.012716444830099741
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,2048,768,0.0038693332009845306
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,2048,65536,0.15847199492984348
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,2048,1024,0.012071111136012606
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,2048,512,0.003379555626047982
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,2048,768,0.022261333134439256
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,2048,768,0.012116444607575735
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,2048,256,0.003181333343187968
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,2048,512,0.02160177793767717
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,2048,512,0.011705777711338468
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,2048,128,0.0028400001012616684
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,2048,256,0.011720000041855706
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,2048,256,0.02127644419670105
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,2048,64,0.0028204443968004654
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,2048,128,0.01891288823551602
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,2048,32,0.00254133323000537
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,1536,65536,0.037235554721620344
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,2048,64,0.011400000088744693
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,2048,32,0.011006222003036074
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,1536,51200,0.029535111453798082
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,1536,65536,0.06864621904161242
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,1536,65536,0.15930133395724827
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,1536,51200,0.05466755562358432
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,2048,3072,0.013482666677898832
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,1536,16384,0.013518222504191928
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,1536,12288,0.011708444191349877
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,1536,51200,0.13034133116404215
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,1536,16384,0.05646755297978719
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,1536,16384,0.024311999479929607
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,1536,10240,0.016864000095261466
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,1536,12288,0.021156445145606995
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,1536,12288,0.04901688959863451
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,1536,8192,0.014817777607176038
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,2048,1024,0.0229120006163915
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,1536,10240,0.019188443819681805
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,1536,7168,0.013528000149461957
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,1536,10240,0.04438044296370613
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,1536,6144,0.012454222473833295
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,1536,8192,0.03990844554371304
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,1536,8192,0.01719199948840671
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,1536,7168,0.0373599992858039
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,1536,5120,0.011257777611414591
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,1536,7168,0.01648622254530589
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,1536,4096,0.00997155573632982
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,1536,6144,0.03522577881813049
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,1536,6144,0.015504888362354703
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,1536,3584,0.009145778086450364
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,2048,128,0.011008888483047485
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,1536,5120,0.032935112714767456
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,1536,5120,0.014785778191354541
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,1536,3072,0.006272000157170826
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,1536,4096,0.030999110804663763
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,1536,4096,0.014126222994592456
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,1536,2560,0.005590222362014983
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,1536,3584,0.013794666363133324
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,1536,3072,0.028797331783506606
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,1536,3072,0.013428444663683573
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,1536,2560,0.013053333593739403
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,1536,2560,0.027097778187857732
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,1536,1536,0.004511111312442356
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,1536,2048,0.025417778227064345
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,1536,2048,0.013087111214796701
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,1536,1024,0.003842666745185852
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,1536,1536,0.01276266657643848
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,1536,1536,0.025070221887694463
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,1536,768,0.0037164443896876443
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,1536,1024,0.01240799989965227
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,1536,768,0.012038222617573209
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,1536,512,0.003206222214632564
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,1536,768,0.022301332818137273
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,1536,256,0.0029395555870400537
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,1536,512,0.011754666765530905
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,1536,512,0.020582222276263766
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,1536,128,0.002805333377586471
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,1536,256,0.011728888584507836
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,1536,256,0.02090222140153249
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,1536,64,0.002805333377586471
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,1536,128,0.010741333166758219
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,1536,128,0.019239111079110038
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,1536,32,0.0026293332791990707
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,1024,65536,0.025974222355418738
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,1536,64,0.011062222222487131
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,1536,32,0.011372444530328115
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,1536,3584,0.028774221738179524
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,1536,2048,0.005664888769388199
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,1024,65536,0.06499110990100436
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,1024,16384,0.01348000019788742
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,1024,65536,0.15859022405412462
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,1024,51200,0.05260266529189216
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,1024,12288,0.011400000088744693
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,1024,51200,0.1293048858642578
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,1024,16384,0.0233262214395735
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,1024,16384,0.056536886427137584
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,1024,10240,0.010796444283591377
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,1536,1024,0.02311822275320689
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,1024,12288,0.04726577798525492
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,1024,8192,0.009922666682137383
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,1024,10240,0.04321066538492838
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,1024,7168,0.008621333373917473
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,1024,8192,0.016823111308945548
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,1024,7168,0.016156444946924847
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,1024,7168,0.036009778579076133
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,1024,6144,0.008300444318188561
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,1024,6144,0.0332640012105306
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,1024,6144,0.015279110934999255
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,1024,5120,0.007253333098358578
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,1024,5120,0.031735112269719444
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,1024,5120,0.014649778604507446
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,1024,51200,0.022229333718617756
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,1024,4096,0.007324444750944774
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,1024,3584,0.006989333364698622
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,1024,4096,0.03050400151146783
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,1024,3584,0.013468444347381592
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,1024,3072,0.006264888991912206
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,1024,3584,0.02915466825167338
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,1024,12288,0.019558222757445443
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,1024,3072,0.028877334462271795
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,1024,3072,0.013419555293189155
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,1024,2560,0.005872888697518243
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,1024,2048,0.005879111174080107
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,1024,2560,0.026387555731667414
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,1024,2560,0.013090666797426013
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,1024,8192,0.039453334278530545
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,1024,1536,0.004932444542646408
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,1024,2048,0.012522666818565793
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,1024,2048,0.025769778423839148
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,1024,1024,0.004237333519591225
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,1024,1536,0.025016888976097107
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,1024,1536,0.012777778009573618
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,1024,768,0.0038311113086011675
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,1024,1024,0.02252888845072852
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,1024,1024,0.012060444388124677
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,1024,512,0.0034933334423436057
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,1024,768,0.02234488891230689
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,1024,768,0.012071111136012606
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,1024,256,0.0032355555643637977
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,1024,128,0.00286666676402092
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,1024,512,0.0207368897067176
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,1024,512,0.011372444530328115
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,1024,64,0.002834666727317704
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,1024,256,0.011696889168686338
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,1024,32,0.0028239999794297745
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,1024,128,0.01772622267405192
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,1024,128,0.01073155552148819
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,768,65536,0.022092445029152766
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,1024,4096,0.013768889009952545
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,1024,64,0.010675555302037133
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,768,51200,0.018576888574494254
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,1024,32,0.011388444238238864
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,768,16384,0.015066666735543145
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,768,65536,0.0624248915248447
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,768,51200,0.05128177669313219
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,768,65536,0.15794844097561306
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,768,12288,0.009950222240553962
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,768,51200,0.12896622551812068
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,768,16384,0.0229751103454166
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,768,16384,0.05532711082034641
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,768,10240,0.008976000050703684
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,1024,10240,0.01833422150876787
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,768,8192,0.00868977771864997
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,768,12288,0.0473235547542572
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,768,12288,0.01921599937809838
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,768,7168,0.008289777570300633
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,768,8192,0.03770666652255588
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,768,8192,0.016536888149049547
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,768,6144,0.007687110867765214
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,768,7168,0.0159288893143336
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,768,7168,0.03588711222012838
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,768,5120,0.007316444483068254
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,768,6144,0.015454222758611044
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,768,5120,0.014498665928840637
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,768,5120,0.03217688865131802
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,768,4096,0.007374222079912822
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,1024,256,0.020999999509917364
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,768,3584,0.007308444215191736
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,768,4096,0.02882933285501268
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,768,4096,0.014089778065681458
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,768,3072,0.0069546666410234236
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,768,3584,0.013779555757840475
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,768,3584,0.028833776712417603
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,768,2560,0.006616000086069107
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,768,3072,0.013455111119482251
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,768,3072,0.028794666131337483
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,768,2048,0.005247999810510212
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,768,2560,0.012737777498033313
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,768,2560,0.027849776877297297
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,768,1536,0.004559111264016894
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,768,2048,0.01293955577744378
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,768,2048,0.025399110383457605
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,768,10240,0.042423999971813627
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,768,1536,0.01238044434123569
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,768,1536,0.025380444195535447
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,768,768,0.003597333199448056
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,768,1024,0.012091555529170565
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,768,1024,0.023423999547958374
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,768,512,0.0035111109415690103
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,768,768,0.012092444631788464
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,768,6144,0.03390044305059645
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,768,768,0.02102577851878272
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,768,256,0.0031644445326593188
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,768,512,0.011743110915025076
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,768,128,0.0028231110837724474
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,768,256,0.011063111325105032
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,768,256,0.01936444474591149
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,768,64,0.0028577778074476454
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,768,128,0.011366222467687396
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,768,128,0.017883555756674874
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,768,32,0.0028124445428450904
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,768,64,0.01036711119943195
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,512,65536,0.02949955397182041
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,768,32,0.01070755554570092
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,512,51200,0.023687111006842718
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,512,65536,0.06156088908513387
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,512,65536,0.15789600213368735
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,512,16384,0.01001422190003925
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,512,51200,0.0503057771258884
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,512,51200,0.12837333149380153
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,768,10240,0.018221333622932434
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,512,12288,0.008989333278603023
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,512,16384,0.02196888956758711
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,512,16384,0.05504088931613498
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,512,10240,0.007631999750932057
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,512,12288,0.0195777780479855
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,512,10240,0.04280266828007168
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,512,8192,0.008301333420806462
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,512,8192,0.037639998727374606
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,512,8192,0.016505777835845947
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,512,7168,0.008272888759771982
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,512,7168,0.0358915560775333
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,512,6144,0.007600888609886169
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,512,6144,0.01552888916598426
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,512,6144,0.03446311089727614
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,512,5120,0.006970666348934174
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,768,1024,0.0038364442686239877
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,512,5120,0.014838222000333997
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,512,4096,0.007382222347789341
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,512,5120,0.03126488791571723
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,512,12288,0.0462026662296719
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,512,4096,0.014136888914638095
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,512,10240,0.01753422286775377
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,512,4096,0.028824888997607764
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,512,3072,0.006912888752089606
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,512,3584,0.02846933404604594
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,512,3584,0.013749333719412485
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,768,512,0.021627555290857952
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,512,3072,0.013085333009560903
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,512,3072,0.027404444085227117
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,512,2048,0.006579555571079254
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,512,7168,0.016148444679048326
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,512,2560,0.013457777599493662
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,512,2560,0.027110222313139174
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,512,1536,0.004267555558019214
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,512,2048,0.012438221938080259
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,512,2048,0.026038222842746313
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,512,1024,0.0038986665507157645
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,512,1536,0.025380444195535447
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,512,768,0.0036888888312710654
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,512,1024,0.01202400028705597
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,512,1024,0.021957332889238994
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,512,512,0.003152888889114062
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,512,768,0.012080888781282636
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,512,768,0.02312711046801673
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,512,512,0.011408000356621213
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,512,256,0.0028444443725877335
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,512,512,0.02127200033929613
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,512,128,0.002834666727317704
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,512,256,0.010856000085671743
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,512,3584,0.007251555720965068
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,512,64,0.0028124445428450904
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,512,128,0.017619555195172627
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,512,128,0.010413332945770687
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,512,32,0.002826666666401757
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,512,64,0.010053333308961656
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,512,2560,0.006635555376609166
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,512,32,0.010397333237859938
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,256,51200,0.013471110827393003
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,256,65536,0.06004177861743503
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,256,65536,0.15781244966718885
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,256,16384,0.008984888593355814
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,256,51200,0.04880533284611172
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,512,1536,0.012074666718641916
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,256,51200,0.12816888756222194
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,256,12288,0.008303999900817871
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,256,16384,0.021969777014520433
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,256,16384,0.05411377880308363
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,256,10240,0.007840000092983246
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,256,12288,0.0188755558596717
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,256,12288,0.045547554890314736
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,256,8192,0.006934222247865465
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,256,10240,0.04247200157907274
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,256,7168,0.006623999940024481
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,256,8192,0.016241777274343703
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,256,8192,0.0366613335079617
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,256,6144,0.006596444381607904
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,256,7168,0.016211556063758004
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,512,256,0.020970667401949566
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,256,7168,0.03577422102292379
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,256,5120,0.006219555520349079
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,256,6144,0.014867555763986377
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,256,6144,0.03425155414475335
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,256,4096,0.005955555372767978
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,256,5120,0.031855109665128924
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,256,5120,0.014434667097197639
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,256,65536,0.01514933341079288
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,256,4096,0.02843822373284234
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,256,4096,0.014115555418862237
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,256,3072,0.006240889016124938
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,256,3584,0.013432888521088494
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,256,3584,0.028423110644022625
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,256,2560,0.00628355559375551
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,256,3072,0.027054222093688116
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,256,3072,0.013468444347381592
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,256,2048,0.005910222315125995
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,256,2560,0.026844445202085707
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,256,2560,0.012770666844315
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,256,1536,0.004229333251714706
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,256,2048,0.013065777719020844
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,256,2048,0.02495288848876953
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,256,1024,0.003903999924659729
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,256,1536,0.024051555328898962
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,256,1536,0.012093333734406365
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,256,768,0.0035457776652442086
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,256,1024,0.022682666778564453
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,256,1024,0.011714666253990598
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,256,512,0.003157333367400699
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,256,10240,0.017906667457686532
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,256,768,0.011733333269755045
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,256,768,0.02158044444190131
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,256,256,0.0029297777348094513
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,256,128,0.002558222247494592
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,256,512,0.02130577796035343
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,256,512,0.011366222467687396
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,256,64,0.0025928889711697898
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,256,256,0.011006222003036074
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,256,32,0.002524444419476721
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,256,128,0.01885600056913164
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,256,128,0.010422222316265106
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,128,65536,0.014764444695578681
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,256,64,0.010050666828950247
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,256,32,0.010424888796276517
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,128,65536,0.059192001819610596
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,256,3584,0.006584888945023219
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,128,16384,0.007987555530336168
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,128,65536,0.15591111448076037
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,128,51200,0.04710666669739617
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,128,12288,0.007650666766696506
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,128,51200,0.1273768875333998
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,128,16384,0.02162222233083513
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,128,16384,0.0545457767115699
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,128,10240,0.007280000381999546
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,128,8192,0.007051555646790399
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,128,12288,0.04610400067435371
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,128,12288,0.01887911061445872
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,128,7168,0.006301333506902059
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,128,10240,0.01787911189926995
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,128,8192,0.016193777322769165
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,128,8192,0.037314666642083064
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,128,6144,0.006518222391605377
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,128,7168,0.03640710976388719
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,128,7168,0.015832889411184523
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,128,5120,0.005931555396980709
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,128,5120,0.014447111222479077
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,128,6144,0.01482311056719886
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,128,6144,0.033886220720079206
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,256,256,0.020232000284724765
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,128,4096,0.0058293334311909145
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,128,3584,0.006268444574541516
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,128,5120,0.03153955605294969
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,128,4096,0.013751111096805997
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,128,3072,0.005917333480384614
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,128,51200,0.012739555703269111
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,128,3584,0.013437333206335703
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,128,3584,0.028428445259730022
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,128,3072,0.013077333569526672
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,128,2560,0.012773333324326409
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,128,2048,0.005904888941182031
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,128,2560,0.026778666509522334
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,128,2048,0.025376889440748427
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,128,2048,0.01255022237698237
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,128,1536,0.00453599997692638
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,128,10240,0.04242222176657783
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,128,1024,0.003859555555714501
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,128,1536,0.0239991115199195
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,128,1024,0.012111999922328524
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,128,768,0.003552000141806073
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,128,1024,0.0225262227985594
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,128,768,0.021943110558721755
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,128,768,0.012044444680213928
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,128,512,0.0031511110977994073
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,128,4096,0.0288355549176534
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,128,512,0.011768889096048145
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,128,256,0.0030942221896515954
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,128,2560,0.0058986664646201665
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,128,128,0.0028293333533737394
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,128,256,0.01142133358452055
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,128,3072,0.026732444763183594
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,128,64,0.0028080000645584534
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,128,128,0.018584888842370775
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,128,128,0.010407110883129967
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,128,32,0.002530666689078013
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,64,65536,0.011409777734014722
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,128,64,0.009853333234786987
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,64,51200,0.00998933364947637
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,128,32,0.01033155537313885
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,64,16384,0.007242666350470648
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,64,65536,0.057561775048573814
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,64,12288,0.006596444381607904
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,64,51200,0.04630400074852837
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,128,1536,0.01240533341964086
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,64,16384,0.021312000022994146
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,64,8192,0.0062871111763848206
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,64,12288,0.019268444842762418
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,64,10240,0.01751377847459581
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,64,7168,0.006304889089531369
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,64,6144,0.0063386667105886675
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,64,8192,0.016180444094869826
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,64,5120,0.005594666633341048
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,64,7168,0.015806222955385845
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,64,4096,0.005559999909665849
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,128,512,0.02092622220516205
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,64,5120,0.014475555883513557
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,64,3584,0.005949333310127258
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,64,3072,0.005934222290913264
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,64,4096,0.013753777576817406
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,64,2560,0.005902222047249476
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,64,3584,0.013390222357379066
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,64,3072,0.01309866706530253
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,64,2048,0.005530666559934616
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,64,1536,0.004545777622196409
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,64,2560,0.01274222218328052
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,64,1024,0.003621333175235324
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,64,2048,0.012732444538010491
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,64,768,0.003256888853179084
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,64,1536,0.01205244412024816
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,64,512,0.0028728888266616394
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,64,1024,0.011762667033407422
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,64,256,0.002599999929467837
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,64,768,0.011688888900809817
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,64,128,0.002492444382773505
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,64,512,0.011373333632946014
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,64,64,0.002491555487116178
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,64,10240,0.006070222291681502
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,64,256,0.01092888911565145
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,64,32,0.002469333302643564
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,64,128,0.010676444404655032
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,32,65536,0.008982222113344405
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,64,64,0.01033155537313885
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,32,51200,0.008330666356616551
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,64,32,0.01036622209681405
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,32,16384,0.006641777853171031
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,32,12288,0.005881777654091517
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,32,65536,0.05646489063898722
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,32,10240,0.00629688882165485
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,64,6144,0.015178667174445258
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,32,16384,0.021382222572962444
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,32,8192,0.005607999861240387
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,32,12288,0.018580444984965853
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,32,7168,0.006253333141406377
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,32,6144,0.006261333409282897
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,32,10240,0.017557332913080852
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,32,8192,0.016413332687483895
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,32,5120,0.005491555564933353
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,32,128,256,0.019959999455346
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,32,7168,0.015459555718633862
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,32,4096,0.0052791109515561005
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,32,3584,0.005949333310127258
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,32,5120,0.01443199978934394
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,32,3072,0.005538666827811136
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,32,4096,0.013528889252079858
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,32,2560,0.005619555711746216
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,32,3584,0.013451555536852943
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,32,2048,0.005558222118351195
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,32,2560,0.01275644451379776
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,32,1536,0.0041742221348815495
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,32,1024,0.003563555578390757
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,32,2048,0.0123831108212471
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,32,768,0.0031617778456873367
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,32,1536,0.01275199982855055
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,32,512,0.0031946665710873077
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,32,768,0.011687999798191918
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,32,256,0.002487999904486868
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,32,512,0.012072000238630505
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,32,128,0.002512000087234709
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,32,51200,0.04653155472543505
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,32,256,0.011034666664070554
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,32,64,0.0025333333760499954
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,32,32,32,0.002480888946188821
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,32,128,0.011750222080283694
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,32,64,0.01035911093155543
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,32,32,0.010320888625250923
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,32,6144,0.01517955627706316
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,32,3072,0.01312800000111262
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,65536,16384,0.17215822802649605
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,65536,16384,0.3618488841586643
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,65536,51200,0.5021440188090006
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,65536,12288,0.2731786568959554
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,32,32,1024,0.011711999773979187
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,65536,10240,0.2278817759619819
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,65536,10240,0.11216889487372504
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,65536,8192,0.18556622664133707
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,65536,8192,0.09678044584062363
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,65536,51200,1.1156835556030273
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,65536,7168,0.11413955688476562
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,65536,6144,0.1386622190475464
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,65536,5120,0.11608444319831
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,65536,6144,0.08631466494666205
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,65536,4096,0.09636888901392619
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,65536,3584,0.08346133099661933
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,65536,4096,0.06765333149168226
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,65536,3072,0.07215911149978638
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,65536,5120,0.08450933297475179
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,65536,3584,0.061181333329942494
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,65536,2560,0.060532444053226046
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,65536,2048,0.04944088723924425
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,65536,2560,0.049082666635513306
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,65536,1536,0.03755999935997857
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,65536,12288,0.1307955582936605
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,65536,1024,0.02743822170628442
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,65536,3072,0.05568799707624647
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,65536,2048,0.04014755619896783
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,65536,1536,0.03458666801452637
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,65536,768,0.020616888999938965
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,65536,512,0.014409777190950183
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,65536,256,0.008994667066468133
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,65536,7168,0.16159378157721624
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,65536,768,0.022484444909625586
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,65536,512,0.01886044442653656
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,65536,64,0.0042204442951414315
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,65536,256,0.016161777906947665
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,65536,32,0.004550222307443619
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,65536,64,0.014808000789748298
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,65536,128,0.013767999907334646
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,65536,32,0.015114666687117683
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,51200,51200,0.4036782317691379
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,51200,65536,0.5263937844170464
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,51200,16384,0.2700515588124593
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,51200,12288,0.2037342256969876
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,51200,16384,0.13999911149342856
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,51200,51200,0.8273733456929525
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,65536,128,0.006274666637182236
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,51200,65536,1.094936900668674
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,65536,1024,0.026521777113278706
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,51200,12288,0.10714577966266209
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,51200,8192,0.1394408941268921
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,51200,7168,0.12440710597568089
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,51200,6144,0.105785780482822
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,51200,10240,0.09204266468683879
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,51200,8192,0.07927555508083768
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,51200,7168,0.08105333646138509
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,51200,5120,0.08883733219570583
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,51200,4096,0.07309422228071424
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,51200,6144,0.07004800107744005
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,51200,3584,0.06479022237989637
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,51200,3584,0.05204800102445814
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,51200,2560,0.046579556332694165
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,51200,3072,0.04646133383115133
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,51200,2560,0.040829333994123675
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,51200,1536,0.030446221431096394
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,51200,3072,0.055824889077080615
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,51200,5120,0.07194666730033027
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,51200,1024,0.02201955517133077
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,51200,768,0.016524444023768108
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,51200,2048,0.03498133354716831
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,51200,4096,0.055085334512922496
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,51200,512,0.011696000066068439
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,51200,256,0.00793866647614373
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,51200,768,0.020597333709398907
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,51200,128,0.004567111117972268
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,51200,256,0.014780445231331719
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,51200,64,0.00387999994887246
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,51200,128,0.013796444568369122
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,51200,10240,0.1724568870332506
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,51200,32,0.0042204442951414315
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,51200,64,0.01441511180665758
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,51200,32,0.014386667145623101
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,16384,65536,0.33270666334364146
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,16384,65536,0.19238666693369547
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,16384,51200,0.2613351080152723
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,16384,16384,0.08402399884329902
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,51200,2048,0.03829955392413669
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,16384,51200,0.14356888665093318
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,16384,12288,0.06325866778691609
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,16384,10240,0.053824888335333936
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,16384,16384,0.05746666590372721
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,51200,1024,0.023333332604832117
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,16384,8192,0.045088890526029796
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,16384,10240,0.04013244311014811
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,16384,7168,0.03875733415285746
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,51200,512,0.01751733322938283
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,16384,6144,0.03353066576851739
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,16384,5120,0.029622223642137315
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,16384,7168,0.03847466574774848
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,16384,4096,0.024401777320437964
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,16384,6144,0.0355386667781406
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,16384,3584,0.02159022291501363
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,16384,5120,0.03103999959097968
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,16384,3072,0.01888533267709944
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,16384,4096,0.027298667364650305
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,16384,2560,0.016148444679048326
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,16384,2048,0.013423999978436364
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,16384,3584,0.02642400066057841
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,16384,1536,0.011028444601429833
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,16384,2560,0.022298667165968154
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,16384,2048,0.019543111324310303
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,16384,1024,0.008641777767075432
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,16384,768,0.006928000185224745
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,16384,1024,0.015125332607163323
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,16384,512,0.005224888937340842
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,16384,768,0.014502222339312235
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,16384,256,0.003540444291300244
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,51200,1536,0.028561777538723413
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,16384,256,0.01254755589697096
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,16384,128,0.0032186667538351486
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,16384,64,0.0032044444233179092
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,16384,12288,0.04508622156249153
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,16384,32,0.00315022220214208
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,16384,128,0.012077333198653327
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,16384,64,0.011373333632946014
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,16384,8192,0.03611022233963013
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,16384,32,0.01203644441233741
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,12288,65536,0.2559555636511909
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,12288,51200,0.20068889194064668
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,12288,65536,0.15978222423129612
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,12288,16384,0.07206844621234469
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,12288,51200,0.12457777394188775
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,12288,12288,0.055849777327643506
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,12288,16384,0.04988444513744778
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,16384,1536,0.017795556121402316
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,12288,12288,0.040397332774268255
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,12288,8192,0.040022220876481794
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,12288,10240,0.03633600142267015
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,12288,7168,0.035523557000690036
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,12288,6144,0.031311998764673867
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,12288,8192,0.03273955649799771
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,12288,5120,0.027672888504134283
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,12288,7168,0.037631998459498085
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,12288,4096,0.020624000165197585
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,12288,6144,0.03051555487844679
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,16384,512,0.013078221844302284
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,12288,3584,0.01772177716096242
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,12288,5120,0.027403554982609216
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,12288,3072,0.015799111790127225
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,12288,2560,0.013106666505336761
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,12288,4096,0.02387111054526435
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,12288,2048,0.011672000090281168
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,12288,3584,0.0236791107389662
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,12288,1536,0.009692444569534725
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,12288,1024,0.008271999657154083
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,12288,2560,0.02053244411945343
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,12288,2048,0.0188426673412323
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,12288,768,0.006554666492674086
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,12288,1536,0.01755644381046295
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,12288,512,0.004534222185611725
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,12288,256,0.00397866674595409
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,12288,1024,0.01477599971824222
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,12288,128,0.0032151111712058387
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,12288,768,0.013831111292044321
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,12288,512,0.013148444394270578
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,12288,64,0.0031804444475306403
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,12288,256,0.011688888900809817
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,12288,128,0.011047110789351992
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,12288,64,0.012070222033394707
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,12288,32,0.011721777419249216
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,16384,3072,0.02392888896995121
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,12288,10240,0.04719733198483785
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,10240,65536,0.21899822023179796
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,10240,51200,0.1741422282324897
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,10240,16384,0.06174933248096042
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,10240,65536,0.15219377146826849
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,10240,51200,0.11945245001051162
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,10240,10240,0.042303111818101674
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,10240,16384,0.0488302210966746
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,10240,12288,0.03906133439805772
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,10240,8192,0.036729776197009616
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,10240,7168,0.0323022206624349
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,10240,10240,0.03532000051604377
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,10240,6144,0.028012444575627644
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,10240,8192,0.031345778041415744
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,12288,3072,0.022037333912319605
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,10240,5120,0.024173332585228816
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,10240,4096,0.01833066675398085
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,10240,7168,0.030704001585642498
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,10240,3584,0.016162667009565566
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,10240,6144,0.027726221415731642
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,10240,3072,0.01458044515715705
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,10240,5120,0.02568622264597151
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,10240,4096,0.0214373336897956
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,10240,2560,0.01254488858911726
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,10240,3584,0.021331555313534204
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,10240,2048,0.011009777585665384
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,10240,1536,0.00905777762333552
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,10240,1024,0.0075288886825243635
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,12288,32,0.003072888900836309
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,10240,2048,0.017543110582563613
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,10240,768,0.0058959999846087555
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,10240,1536,0.016011555989583332
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,10240,1024,0.013448889056841532
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,10240,256,0.0038480001191298165
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,10240,768,0.013242666920026144
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,10240,512,0.01272266689274046
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,10240,128,0.0032799999333090256
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,10240,64,0.002867555452717675
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,10240,256,0.011374221907721626
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,10240,32,0.0031644445326593188
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,10240,128,0.011032000184059143
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,10240,64,0.011063999599880643
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,10240,12288,0.049138665199279785
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,10240,32,0.011413333316644033
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,8192,65536,0.17468267016940645
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,8192,65536,0.10281422403123643
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,8192,51200,0.1400560008154975
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,8192,51200,0.08120355341169569
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,8192,12288,0.033414221472210355
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,8192,10240,0.028100444210900202
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,8192,16384,0.03661244445376926
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,8192,12288,0.030128889613681372
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,8192,8192,0.023743111226293776
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,8192,7168,0.02085688875781165
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,10240,2560,0.019072888625992667
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,8192,10240,0.027230223019917805
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,10240,3072,0.020596444606781006
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,8192,6144,0.01854222185081906
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,10240,512,0.004621333132187526
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,8192,5120,0.016146666473812528
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,8192,7168,0.024496888120969135
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,8192,4096,0.013714666995737286
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,8192,6144,0.02290577855375078
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,8192,3584,0.012056888805495368
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,8192,3072,0.011055111057228513
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,8192,5120,0.022198221749729578
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,8192,4096,0.019708444674809773
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,8192,3584,0.019096000327004325
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,8192,3072,0.017653332816229928
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,8192,1536,0.007238222493065729
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,8192,2048,0.015623110863897534
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,8192,1024,0.005574222240183089
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,8192,1536,0.013919111755159167
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,8192,768,0.0040702223777771
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,8192,1024,0.013086222112178802
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,8192,16384,0.042048000627093844
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,8192,512,0.0036559998989105225
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,8192,256,0.0032151111712058387
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,8192,512,0.01239377756913503
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,8192,256,0.011361777782440186
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,8192,128,0.003216000066863166
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,8192,64,0.0028826666788922418
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,8192,128,0.010679999987284342
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,8192,32,0.003156444471743372
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,8192,8192,0.02365333338578542
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,8192,32,0.011704000333944956
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,7168,65536,0.15171733167436388
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,8192,2560,0.00978577799267239
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,8192,2048,0.008571555217107138
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,7168,16384,0.043783999151653714
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,7168,65536,0.09502577781677246
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,7168,12288,0.03451822201410929
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,7168,51200,0.07464977767732409
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,7168,10240,0.029715554581748113
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,7168,16384,0.034352001216676496
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,7168,8192,0.022481777601771887
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,7168,12288,0.028526223368114893
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,8192,768,0.012763555679056378
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,7168,10240,0.025684444440735713
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,7168,7168,0.018896889355447557
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,7168,6144,0.01681066718366411
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,7168,7168,0.023968888653649226
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,7168,5120,0.014692443940374585
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,7168,6144,0.021722666091389124
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,7168,4096,0.012400888734393649
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,8192,64,0.011076444553004371
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,7168,5120,0.020269332660569083
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,7168,3584,0.011113777756690979
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,7168,3072,0.010045333041085137
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,7168,3584,0.01864088906182183
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,7168,2560,0.009007111191749573
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,7168,3072,0.017498667041460674
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,7168,2048,0.007648888561460707
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,8192,2560,0.017483555608325534
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,7168,2560,0.01714933415253957
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,7168,1536,0.006634666687912411
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,7168,1024,0.004951999833186467
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,7168,2048,0.01478488908873664
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,7168,768,0.003846222327815162
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,7168,1536,0.014102222190962898
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,7168,512,0.003551111039188173
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,7168,1024,0.013106666505336761
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,7168,256,0.003236444460021125
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,7168,768,0.01275466630856196
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,7168,128,0.0028782222006056043
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,7168,512,0.012410666379663678
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,7168,8192,0.022648000054889258
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,7168,64,0.0028151110228565005
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,7168,32,0.0028115556471877625
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,7168,128,0.010747555229398938
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,7168,64,0.011363555159833698
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,7168,32,0.012031111452314587
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,6144,65536,0.12744443946414524
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,6144,51200,0.10094310839970906
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,6144,65536,0.09009333451588948
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,7168,4096,0.018862222631772358
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,6144,51200,0.06810577710469563
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,6144,16384,0.03809066613515218
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,6144,12288,0.030373334884643555
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,6144,10240,0.02604088849491543
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,6144,16384,0.03233688738611009
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,6144,8192,0.021967111362351313
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,6144,12288,0.026205332742797002
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,6144,10240,0.023244443866941664
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,6144,7168,0.01997511088848114
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,7168,51200,0.12093688382042779
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,6144,6144,0.01755466726091173
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,6144,8192,0.021212443709373474
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,6144,7168,0.022686221533351477
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,6144,6144,0.021192888418833416
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,6144,5120,0.01550222271018558
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,6144,5120,0.019152889649073284
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,6144,3584,0.010323555933104621
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,6144,3072,0.00943022221326828
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,6144,2560,0.008390222158696916
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,6144,4096,0.018167111608717177
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,6144,3584,0.01772533357143402
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,6144,2048,0.0075795559419526
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,6144,1536,0.006267555471923616
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,6144,2560,0.01590666671593984
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,7168,256,0.012069332930776807
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,6144,1024,0.004276444514592488
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,6144,768,0.0038853333228164246
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,6144,2048,0.014155555102560254
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,6144,512,0.0034471110751231513
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,6144,1024,0.013079110946920184
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,6144,256,0.003253333270549774
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,6144,768,0.012446222205956778
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,6144,128,0.0028773333049482773
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,6144,512,0.011757333245542316
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,6144,64,0.0028568889117903183
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,6144,32,0.0028693332440323303
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,6144,256,0.011027555498811932
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,6144,128,0.01072177787621816
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,6144,64,0.010672888822025724
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,5120,65536,0.1079368856218126
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,6144,32,0.011740444435013665
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,5120,51200,0.08642666869693333
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,5120,16384,0.03227377931276957
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,5120,65536,0.07909066809548272
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,5120,12288,0.026155556241671245
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,5120,10240,0.022823111878501043
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,5120,51200,0.0629040002822876
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,5120,16384,0.029862221744325426
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,5120,8192,0.019959110352728102
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,5120,12288,0.023690667417314317
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,6144,4096,0.012608889076444836
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,5120,7168,0.017670222454600863
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,5120,10240,0.021956443786621094
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,5120,6144,0.015750222735934787
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,5120,5120,0.014118222726715935
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,5120,8192,0.02070844504568312
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,5120,4096,0.010864888628323873
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,5120,6144,0.020228443874253165
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,5120,3584,0.009739555418491364
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,6144,3072,0.01717155509524875
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,5120,5120,0.018936889039145578
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,5120,4096,0.01789155602455139
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,5120,3584,0.017343110508388944
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,5120,2560,0.007652444144090016
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,6144,1536,0.013463111387358772
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,5120,3072,0.016137777103318107
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,5120,2048,0.006959111326270633
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,5120,1536,0.006233777850866318
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,5120,1024,0.004787555585304896
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,5120,2560,0.014814222852389017
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,5120,2048,0.014171555638313293
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,5120,1536,0.013425778183672162
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,5120,768,0.004187555362780889
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,5120,512,0.003843555433882607
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,5120,1024,0.012431999875439538
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,5120,256,0.003216000066863166
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,5120,128,0.0028799999919202593
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,5120,768,0.01239911135700014
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,5120,512,0.011878222227096558
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,5120,64,0.002817777709828483
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,5120,256,0.011707555916574268
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,5120,32,0.0028124445428450904
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,5120,128,0.010334221853150262
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,5120,64,0.010791111323568555
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,4096,65536,0.08907822105619644
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,5120,32,0.011765333513418833
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,4096,51200,0.07141155666775174
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,4096,16384,0.026800000005298193
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,4096,12288,0.02127555509408315
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,4096,51200,0.05835555659400093
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,4096,10240,0.01865688959757487
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,4096,16384,0.026532444689008925
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,5120,7168,0.02198666665289137
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,4096,8192,0.016351110405392118
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,4096,7168,0.014020444618331062
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,5120,3072,0.008952889177534316
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,4096,10240,0.020915556285116408
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,4096,6144,0.012506666282812754
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,4096,8192,0.01992266707950168
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,4096,5120,0.011090666883521609
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,4096,7168,0.020346666375796
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,4096,4096,0.009724444813198512
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,4096,6144,0.01904622217019399
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,4096,3584,0.009054222040706212
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,4096,3072,0.008344888687133789
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,4096,5120,0.017860444055663217
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,4096,2560,0.0074684446056683855
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,4096,4096,0.017186666528383892
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,4096,3584,0.01591377788119846
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,4096,2048,0.006279110908508301
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,4096,1536,0.004925333377387789
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,4096,2560,0.014472888575659858
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,4096,1024,0.0038808890514903595
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,4096,2048,0.013703111145231458
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,4096,1536,0.013086222112178802
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,4096,768,0.003882666842805015
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,4096,512,0.003516444315512975
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,4096,1024,0.012489777472284106
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,4096,256,0.0031600000543726813
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,4096,768,0.012091555529170565
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,4096,512,0.011765333513418833
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,4096,128,0.0028640000770489373
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,4096,64,0.002842666581273079
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,4096,256,0.011185777684052786
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,4096,32,0.002814222127199173
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,4096,128,0.010612444745169746
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,4096,64,0.010694222317801582
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,3584,65536,0.07719466421339247
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,4096,12288,0.022443556123309668
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,4096,32,0.011023110813564725
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,3584,51200,0.06174577607048882
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,3584,16384,0.02481422159406874
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,3584,65536,0.07032355335023668
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,3584,12288,0.01975022256374359
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,3584,51200,0.056672890981038414
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,3584,10240,0.01718933383623759
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,3584,16384,0.02532177832391527
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,3584,8192,0.014759999182489185
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,3584,12288,0.021941334009170532
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,3584,7168,0.013435555828942193
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,3584,6144,0.01202488856183158
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,3584,10240,0.020612445142534044
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,3584,8192,0.019312888383865356
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,3584,5120,0.010612444745169746
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,4096,3072,0.0151573336786694
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,3584,4096,0.009927999642160203
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,3584,3584,0.008616000413894653
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,3584,6144,0.018175111876593698
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,3584,3072,0.008039111064540016
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,3584,4096,0.01644088824590047
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,3584,3584,0.015230221880806817
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,3584,2560,0.006945778098371293
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,3584,2048,0.006267555471923616
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,3584,3072,0.01428711083200243
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,3584,1536,0.004867555366622077
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,3584,2560,0.014098667436175875
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,4096,65536,0.0738204452726576
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,3584,2048,0.013808888693650564
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,3584,768,0.0038773334688610504
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,3584,1536,0.012780444489585029
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,3584,512,0.003504000190231535
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,3584,1024,0.012065778175989786
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,3584,768,0.012424888710180918
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,3584,256,0.0031831111345026228
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,3584,512,0.011728000309732227
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,3584,128,0.0028719999310043124
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,3584,256,0.011791999969217511
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,3584,64,0.002847111059559716
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,3584,32,0.0026462222966882917
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,3584,128,0.010355555348926121
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,3584,64,0.011624889241324531
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,3072,65536,0.06830933358934191
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,3584,7168,0.019536889261669584
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,3584,32,0.011372444530328115
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,3072,51200,0.05287555522388882
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,3072,16384,0.02125511070092519
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,3584,5120,0.016978666186332703
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,3072,65536,0.06838666730456881
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,3072,12288,0.01806311143769158
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,3072,51200,0.054874665207333036
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,3072,10240,0.015489778584904142
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,3072,8192,0.013587555951542325
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,3072,12288,0.021436444587177698
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,3072,7168,0.013073777986897362
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,3072,10240,0.020281778441535104
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,3072,6144,0.011717333561844297
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,3072,8192,0.01869066721863217
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,3072,5120,0.011012444065676795
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,3584,1024,0.0038417776425679526
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,3072,4096,0.009992889232105678
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,3072,7168,0.018931556079122756
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,3072,3584,0.008291555775536431
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,3072,3072,0.00757155567407608
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,3072,5120,0.01704266667366028
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,3072,2560,0.007311999797821045
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,3072,4096,0.014789332946141561
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,3072,3584,0.014676445060306124
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,3072,2048,0.0058853332367208265
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,3072,1536,0.005606222069925732
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,3072,3072,0.014142221874660917
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,3072,1024,0.004585777719815572
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,3072,2560,0.013815110756291283
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,3072,2048,0.013095999757448832
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,3072,768,0.0038986665507157645
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,3072,512,0.003560888684458203
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,3072,1536,0.0127697777416971
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,3072,256,0.0032017777363459268
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,3072,1024,0.012313777373896705
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,3072,768,0.012148444851239523
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,3072,128,0.002875555513633622
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,3072,512,0.011766222616036734
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,3072,64,0.0028577778074476454
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,3072,32,0.0028284444577164124
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,3072,256,0.011399110986126794
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,3072,128,0.010686222049925061
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,3072,64,0.01069155583779017
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,2560,65536,0.06042666567696465
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,3072,32,0.010681777364677854
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,2560,51200,0.04696089029312134
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,2560,16384,0.0192577772670322
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,2560,12288,0.015558222929636637
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,2560,65536,0.06533333328035143
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,2560,10240,0.01399466726515028
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,2560,16384,0.024337778488794964
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,2560,12288,0.02131555477778117
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,2560,8192,0.01239822225438224
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,2560,7168,0.011686222420798408
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,2560,10240,0.019719110594855416
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,2560,6144,0.010674667027261523
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,3072,6144,0.017309332887331646
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,2560,8192,0.01851111153761546
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,2560,5120,0.010041777458455827
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,2560,7168,0.018696889281272888
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,2560,4096,0.008692444198661381
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,2560,6144,0.016932444439993966
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,2560,3584,0.00795288880666097
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,2560,5120,0.01518133282661438
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,2560,3072,0.007743111087216272
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,2560,2560,0.006730666591061487
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,2560,4096,0.014472888575659858
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,2560,2048,0.005552000055710475
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,2560,3072,0.013572444518407186
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,2560,1536,0.005336888962321811
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,2560,2048,0.01278133359220293
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,2560,1024,0.0041857775714662345
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,2560,1536,0.012500444220172035
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,2560,768,0.0038453332251972626
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,2560,1024,0.012053333222866058
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,2560,512,0.0035048888789282907
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,2560,768,0.012122666670216454
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,2560,256,0.0031804444475306403
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,2560,512,0.011866666376590729
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,3072,16384,0.024728000164031982
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,2560,128,0.0028195555011431375
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,2560,64,0.0028231110837724474
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,2560,256,0.011284444067213269
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,2560,32,0.00282577777074443
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,2560,128,0.01034222212102678
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,2560,64,0.0107022225856781
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,2560,32,0.010876444478829702
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,2048,51200,0.03831200136078729
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,2048,65536,0.06346311171849568
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,2560,3584,0.014107555150985718
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,2048,16384,0.01831999917825063
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,2560,2560,0.013726222018400827
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,2048,51200,0.05163822240299649
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,2048,12288,0.014870221416155497
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,2048,16384,0.023949333363109167
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,2048,10240,0.013591999808947245
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,2048,8192,0.012173333101802401
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,2048,12288,0.020640000700950623
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,2048,7168,0.01130488928821352
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,2048,10240,0.019384000036451552
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,2048,8192,0.017811555001470778
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,2048,7168,0.017222222354676988
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,2048,5120,0.009679999616410997
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,2560,51200,0.05298577745755514
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,2048,6144,0.015593777100245157
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,2048,4096,0.008349333372380998
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,2048,3584,0.007259555160999298
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,2048,5120,0.014781332678265043
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,2048,3072,0.006650666809744305
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,2048,3584,0.01408088869518704
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,2048,65536,0.04885688755247328
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,2048,2048,0.0052044445441828836
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,2048,3072,0.013487111363146039
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,2048,2560,0.01313688854376475
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,2048,2048,0.012431999875439538
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,2048,1024,0.0038399998512532976
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,2048,1536,0.012708444562223224
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,2048,768,0.0038399998512532976
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,2048,1024,0.01204355557759603
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,2048,512,0.003504000190231535
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,2048,768,0.01238044434123569
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,2048,256,0.003126222226354811
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,2048,512,0.011746666497654386
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,2048,128,0.002862222285734283
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,2048,6144,0.010660444696744284
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,2048,256,0.011710222396585675
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,2048,64,0.0028213332924577924
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,2048,32,0.0028035555862718155
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,2048,128,0.01035377797153261
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,2048,64,0.011017777853541903
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,1536,65536,0.038219554556740656
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,2048,32,0.011047110789351992
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,1536,51200,0.030084444416893855
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,1536,16384,0.01349955548842748
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,2048,2560,0.005893333504597346
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,1536,12288,0.011734222372372946
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,1536,16384,0.02332088847955068
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,2048,1536,0.004583111239804162
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,1536,10240,0.010677333507272931
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,1536,12288,0.020257777637905545
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,1536,8192,0.015448000695970325
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,1536,7168,0.010904889139864178
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,1536,10240,0.018826666805479262
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,1536,8192,0.01684977776474423
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,1536,6144,0.010846222440401712
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,1536,5120,0.009695111049546136
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,1536,7168,0.015805333852767944
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,1536,4096,0.008348444269763099
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,1536,6144,0.015226667126019796
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,1536,3584,0.007947555846638149
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,1536,4096,0.014096000128322177
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,1536,3072,0.006569777925809224
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,1536,3584,0.013776000175211163
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,1536,2560,0.005605333381228977
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,1536,3072,0.01311911145846049
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,1536,2048,0.004930666751331753
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,1536,2560,0.01311911145846049
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,1536,1536,0.00452888881166776
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,2048,4096,0.014168888330459595
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,1536,2048,0.01257599973016315
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,1536,1024,0.003980444537268745
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,1536,768,0.003536000019974179
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,1536,51200,0.05001066790686714
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,1536,1536,0.012739555703269111
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,1536,512,0.003216000066863166
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,1536,1024,0.01182044463025199
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,1536,256,0.0031759999692440033
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,1536,128,0.002817777709828483
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,1536,768,0.012425777812798819
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,1536,512,0.011744000017642975
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,1536,64,0.002514666567246119
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,1536,32,0.0028444443725877335
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,1536,256,0.011006222003036074
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,1536,128,0.010467555787828235
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,1024,65536,0.027318222655190363
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,1536,64,0.010677333507272931
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,1024,51200,0.02381955583890279
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,1536,32,0.010680889089902243
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,1024,16384,0.012348444097571902
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,1024,65536,0.05819288889567057
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,1024,12288,0.011734222372372946
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,1024,10240,0.010378667049937779
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,1024,51200,0.047855999734666615
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,1024,8192,0.009328888522254096
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,1024,16384,0.022894221875402663
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,1536,5120,0.014787554740905762
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,1024,7168,0.008671110702885522
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,1024,6144,0.008975110948085785
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,1024,10240,0.01769333415561252
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,1024,5120,0.008208889100286696
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,1024,8192,0.016554666890038382
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,1024,4096,0.007283555964628856
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,1024,6144,0.015169777803950839
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,1024,3584,0.006899555524190267
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,1024,5120,0.014496000276671516
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,1024,3072,0.006267555471923616
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,1024,4096,0.014148443937301636
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,1024,2560,0.005635555419656966
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,1024,3584,0.013682666752073499
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,1024,2048,0.0058711109062035876
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,1024,3072,0.013406222065289816
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,1536,65536,0.06128799915313721
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,1024,2560,0.013287111288971372
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,1024,1024,0.003913777983850903
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,1024,2048,0.012448000411192576
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,1024,768,0.0038328886859946777
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,1024,1536,0.012431110772821637
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,1024,512,0.003506666670242945
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,1024,1024,0.012148444851239523
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,1024,256,0.0031999999450312722
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,1024,768,0.012033777932325998
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,1024,128,0.002854222224818336
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,1024,512,0.011752888560295105
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,1024,64,0.0028168888141711554
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,1024,256,0.011765333513418833
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,1024,32,0.0028488888508743713
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,1024,128,0.010346666806273991
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,768,65536,0.023969777756267126
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,1024,64,0.011004444625642566
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,1024,12288,0.0192266669538286
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,768,51200,0.019526221685939364
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,1024,32,0.011215111447705163
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,768,16384,0.011026666396194033
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,768,12288,0.011167999770906238
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,1024,7168,0.015807110402319167
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,768,65536,0.05663022067811754
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,768,51200,0.04624888963169522
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,768,8192,0.008828444613350762
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,768,12288,0.018940443793932598
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,768,10240,0.017515555024147034
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,768,7168,0.00794666674402025
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,768,6144,0.00832622249921163
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,768,8192,0.016140444411171805
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,768,5120,0.00794577764140235
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,768,7168,0.015560888581805758
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,768,6144,0.015264888604482016
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,768,4096,0.007263999846246507
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,768,3584,0.006960888703664144
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,768,5120,0.014155555102560254
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,768,3072,0.006246222390068903
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,768,4096,0.013810666898886362
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,768,3584,0.013751111096805997
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,768,3072,0.012907555533779992
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,768,2048,0.005221333354711533
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,768,2560,0.012839111189047495
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,768,1536,0.004502222355869082
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,768,2048,0.01238933371173011
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,768,1024,0.0038568890757030914
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,768,1536,0.012401777837011548
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,768,768,0.0035137778355015647
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,768,1024,0.011414222419261932
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,768,512,0.003145777723855443
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,768,10240,0.009655999640623728
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,768,256,0.0031795555518733132
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,768,512,0.011412444214026133
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,768,128,0.0026488889836602737
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,768,256,0.010703999963071613
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,768,64,0.00254488881263468
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,1024,1536,0.00519466648499171
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,768,128,0.010354667074150508
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,768,32,0.002516444358560774
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,512,65536,0.01777066621515486
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,768,32,0.011001778145631155
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,768,2560,0.00555377784702513
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,512,65536,0.055380443731943764
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,512,16384,0.01039644413524204
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,512,51200,0.045837332804997764
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,512,12288,0.01034311122364468
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,512,16384,0.02093511157565647
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,512,10240,0.00866844422287411
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,512,12288,0.018930666976504855
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,512,8192,0.008270222279760573
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,512,10240,0.017504889104101393
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,512,7168,0.009009777671760982
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,512,6144,0.008555555509196388
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,768,16384,0.021645334031846788
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,512,5120,0.007991111112965478
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,512,7168,0.01584533353646596
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,512,4096,0.007251555720965068
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,512,6144,0.015392889579137167
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,512,3584,0.0069057775868309875
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,512,5120,0.01479555500878228
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,512,3072,0.006312888943486744
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,512,4096,0.013468444347381592
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,512,2560,0.005607111172543631
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,512,3584,0.014088888963063559
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,512,2048,0.005051555732885997
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,768,64,0.01035733355416192
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,512,3072,0.013459555804729462
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,512,1536,0.004602666530344221
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,512,51200,0.015995555453830294
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,512,2048,0.01273333364062839
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,512,1024,0.003858666867017746
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,512,768,0.0034924443397257063
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,512,1536,0.012755555411179861
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,512,512,0.0032382222513357797
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,512,1024,0.011977777712874942
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,512,256,0.0031679999083280563
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,512,512,0.01179377817445331
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,512,128,0.0028853333658642242
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,512,256,0.011367999845080905
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,512,64,0.00282577777074443
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,512,32,0.0028159999185138275
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,512,128,0.011741333537631564
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,768,768,0.01204622205760744
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,512,8192,0.016167110866970487
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,512,32,0.011405333048767514
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,256,51200,0.014921777778201632
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,256,16384,0.009363555245929295
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,256,65536,0.05374755462010702
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,256,12288,0.009489778015348647
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,256,51200,0.044215109613206655
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,256,10240,0.008728000024954477
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,256,16384,0.020938666330443487
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,256,8192,0.007676444119877285
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,256,12288,0.0185253338681327
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,256,7168,0.007303111255168915
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,256,10240,0.017864000466134813
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,512,2560,0.013094222380055321
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,256,6144,0.007319110963079665
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,256,8192,0.016153777639071148
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,256,5120,0.0069102222720781965
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,256,4096,0.006590222318967183
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,256,7168,0.015474667151769003
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,256,6144,0.014837332897716098
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,256,3584,0.006626666833957036
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,256,5120,0.014488889111412896
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,256,3072,0.006238222122192383
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,256,2560,0.006234666539563074
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,256,4096,0.01404266721672482
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,512,768,0.011773332953453064
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,256,3584,0.013780444032616086
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,256,2048,0.006083555519580841
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,256,1536,0.004219555606444676
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,256,3072,0.01314399970902337
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,256,1024,0.003863999827040566
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,256,2560,0.01274577776590983
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,256,768,0.0034924443397257063
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,256,512,0.003133333391613431
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,256,1024,0.011752888560295105
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,256,768,0.011767999993430244
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,256,256,0.003124444435040156
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,512,64,0.011300444602966309
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,256,128,0.002809777855873108
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,256,512,0.011384000380833944
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,256,64,0.002475555572244856
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,256,32,0.002519999941190084
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,256,256,0.010699555277824402
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,256,128,0.011427555647161273
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,128,65536,0.01690933273898231
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,128,51200,0.014189332723617554
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,256,32,0.010692444112565784
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,128,16384,0.008620444271299574
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,128,65536,0.052151110437181264
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,128,12288,0.007651555869314406
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,128,51200,0.04242222176657783
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,128,16384,0.020928889513015747
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,128,12288,0.01888444523016612
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,128,8192,0.0069120000633928515
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,128,10240,0.01745244363943736
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,128,7168,0.006582222051090664
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,128,8192,0.016332444217469957
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,128,6144,0.006589333216349284
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,128,7168,0.015808888607554965
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,128,5120,0.005883555445406172
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,256,2048,0.012401777837011548
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,256,1536,0.01254755589697096
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,128,4096,0.005960888746711943
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,128,6144,0.015124445160230001
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,128,3584,0.005718222094906702
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,128,5120,0.014444443914625378
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,256,65536,0.015799999237060547
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,128,4096,0.014117333624098035
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,128,2560,0.005972444597217772
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,128,3584,0.013746666411558786
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,128,2048,0.005979555762476391
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,128,1536,0.004544888933499654
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,256,64,0.010381333529949188
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,128,2560,0.013392888837390475
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,128,2048,0.012738666600651212
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,128,1024,0.0038906666967603895
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,128,768,0.0035128887328836652
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,128,1536,0.012800888882742988
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,128,512,0.0031635556370019913
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,128,256,0.0029306666304667792
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,128,1024,0.011828444070286222
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,128,768,0.011432888607184092
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,128,128,0.0025351111673646504
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,128,10240,0.007272000114123027
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,128,512,0.012068444656001197
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,128,64,0.002487999904486868
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,128,256,0.011720889144473605
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,128,32,0.00282222218811512
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,128,128,0.010377777947319878
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,64,65536,0.012387555506494312
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,128,64,0.01144444445768992
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,128,32,0.011092444260915121
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,64,16384,0.00796622203456031
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,64,65536,0.051013333929909595
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,64,12288,0.007292444507280986
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,64,51200,0.04283644424544441
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,64,10240,0.007136888802051544
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,64,16384,0.02128177715672387
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,64,8192,0.006637333167923822
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,64,12288,0.018791110979186166
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,64,7168,0.006462222172154321
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,64,10240,0.017883555756674874
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,128,3072,0.005543111099137201
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,64,6144,0.005977777971161737
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,64,8192,0.016203555795881484
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,64,5120,0.006051555689838197
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,64,4096,0.005647111270162795
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,64,7168,0.015512888630231222
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,64,6144,0.014947555131382413
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,64,3584,0.00611111107799742
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,64,3072,0.005587555468082428
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,64,5120,0.014450665977266101
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,64,2560,0.006232000059551663
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,64,4096,0.014135999812020196
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,64,2048,0.005935110979610019
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,64,3584,0.013421333498424955
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,64,3072,0.013063111239009433
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,64,1536,0.004224888980388641
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,64,1024,0.0038746665749284956
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,64,2560,0.013072888884279462
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,64,2048,0.012822222378518848
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,64,768,0.0033191111352708605
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,64,512,0.0032506665835777917
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,64,1024,0.011689778003427716
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,64,256,0.0028204443968004654
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,64,768,0.012095111111799875
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,64,51200,0.010672888822025724
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,64,128,0.0024951110697454875
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,64,64,0.00249422217408816
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,64,256,0.010704889065689512
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,64,32,0.0024782222592168385
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,64,128,0.009992889232105678
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,64,64,0.01109333336353302
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,32,65536,0.012421333127551608
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,32,51200,0.010686222049925061
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,64,32,0.010323555933104621
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,32,16384,0.00758755538198683
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,32,65536,0.05165511038568285
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,32,12288,0.007325333025720384
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,32,16384,0.02077511118517982
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,32,10240,0.006952889263629913
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,128,3072,0.013291555146376291
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,32,12288,0.01887911061445872
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,32,8192,0.006248888870080312
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,32,7168,0.006581333362393909
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,32,10240,0.017210667332013447
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,32,6144,0.005943111247486538
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,32,8192,0.01648355523745219
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,32,5120,0.005910222315125995
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,32,7168,0.01570399933391147
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,32,4096,0.005572444448868434
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,32,6144,0.014833778142929077
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,64,1536,0.012426666915416718
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,32,3584,0.005921777751710679
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,32,5120,0.014495111174053617
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,32,3072,0.0053093334039052325
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,32,2560,0.005601777798599667
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,32,4096,0.013767999907334646
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,64,512,0.012082666986518435
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,32,3584,0.013432000246312885
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,32,3072,0.013427555561065674
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,32,1536,0.004208000169859992
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,32,1024,0.003544888976547453
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,32,2560,0.012789333032237159
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,32,768,0.003499555504984326
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,32,2048,0.012759110993809171
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,32,1536,0.01239466667175293
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,32,512,0.0031804444475306403
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,32,1024,0.011400000088744693
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,32,768,0.011715555356608497
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,32,128,0.0028213332924577924
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,32,512,0.011712888876597086
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,32,64,0.0026373333401150177
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,32,51200,0.04227466715706719
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,32,32,0.002465777720014254
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,32,128,0.010330666270520952
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,32,64,0.011373333632946014
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,32,32,0.010405333505736457
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,65536,51200,0.5003324614630805
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,65536,16384,0.3261137803395589
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,32,256,0.0028515555378463534
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,65536,51200,0.9711884392632378
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,65536,16384,0.17223733001285127
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,17,32,256,0.010743111371994019
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,65536,12288,0.2274248864915636
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,65536,12288,0.13089956177605525
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,65536,10240,0.18896267149183485
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,65536,10240,0.11263377136654323
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,17,32,2048,0.0053297777970631914
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,65536,8192,0.15509866343604192
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,65536,8192,0.0971377756860521
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,65536,7168,0.13433599472045898
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,65536,7168,0.09807911184098984
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,65536,12288,0.2128995524512397
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,65536,10240,0.1824320024914212
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,65536,6144,0.11582756042480469
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,65536,16384,0.27906666861640084
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,65536,5120,0.09734044472376506
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,65536,6144,0.08721333079867893
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,65536,8192,0.15187733703189427
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,65536,4096,0.08169777525795831
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,65536,5120,0.08125333653555976
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,65536,7168,0.1551377773284912
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,65536,4096,0.06538222233454387
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,65536,3584,0.06954399744669597
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,65536,6144,0.15904800097147623
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,65536,3584,0.05766044722663032
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,65536,5120,0.16957333352830675
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,65536,3072,0.0603075557284885
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,65536,2560,0.051170667012532554
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,65536,4096,0.10008711285061306
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,65536,3072,0.05053244365586174
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,65536,2048,0.04213688770929972
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,65536,2560,0.044891556104024254
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,65536,3584,0.1059102217356364
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,65536,1536,0.032736887534459434
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,65536,3072,0.08694755368762547
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,65536,2048,0.03797600004408095
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,65536,2560,0.07565510935253568
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,65536,1024,0.023688889212078516
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,65536,2048,0.0673688915040758
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,65536,1536,0.03389511174625821
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,65536,1024,0.02388266722361247
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,65536,1536,0.05655644337336222
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,65536,512,0.0136808885468377
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,65536,768,0.022104000051816303
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,65536,768,0.04084800018204583
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,65536,256,0.008278222547637092
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,65536,512,0.018578666779730055
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,65536,128,0.006590222318967183
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,65536,256,0.032567110326555036
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,65536,256,0.0158595558669832
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,65536,64,0.005592888842026393
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,65536,128,0.014515555567211576
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,65536,32,0.005920889063013925
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,65536,64,0.015154666370815702
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,65536,32,0.016757332616382174
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,65536,768,0.018626666731304593
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,51200,65536,0.5275875727335612
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,65536,512,0.039621333281199135
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,51200,65536,1.0897262361314561
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,65536,51200,0.8486035664876302
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,51200,51200,0.4029448827107747
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,51200,16384,0.2803368833329943
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,51200,51200,0.850789335038927
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,51200,16384,0.14056532912784153
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,51200,12288,0.20871110757191977
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,65536,1024,0.04634755518701342
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,51200,12288,0.10699199967914158
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,51200,10240,0.17314488357967803
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,51200,10240,0.09203110800849067
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,65536,128,0.02772444486618042
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,51200,8192,0.13957244820064968
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,51200,8192,0.07871911260816786
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,51200,7168,0.12182754940456814
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,51200,12288,0.1836764415105184
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,51200,7168,0.08298666609658135
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,51200,10240,0.15732533401913112
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,51200,8192,0.13129956192440456
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,51200,6144,0.1046782202190823
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,51200,16384,0.23352445496453178
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,51200,5120,0.08947822120454575
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,51200,5120,0.06493688954247369
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,51200,4096,0.07302488883336385
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,51200,7168,0.12379554907480876
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,51200,4096,0.05340266558859083
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,51200,6144,0.11613510714636908
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,51200,3584,0.06488088766733806
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,51200,5120,0.14008177651299372
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,51200,3072,0.05672622389263577
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,51200,3584,0.04812444580925835
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,51200,4096,0.0840231113963657
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,51200,2560,0.04699288805325826
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,51200,3072,0.04716533422470093
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,51200,2048,0.03773422373665704
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,51200,3584,0.0993466642167833
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,51200,2560,0.038000000847710505
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,51200,3072,0.07179733117421468
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,51200,1536,0.029879109727011785
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,51200,2048,0.03525155451562669
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,51200,2560,0.06357066498862372
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,51200,1024,0.021632888250880774
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,51200,1536,0.027373333772023518
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,51200,6144,0.07230577866236369
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,51200,768,0.01623288955953386
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,51200,1536,0.04970399869812859
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,51200,1024,0.02068444424205356
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,51200,1024,0.04165600074662103
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,51200,512,0.011391999820868174
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,51200,768,0.01869244376818339
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,51200,256,0.007576888634098901
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,51200,512,0.016935111747847665
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,51200,512,0.033137778441111244
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,51200,128,0.004644444419278039
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,51200,256,0.013796444568369122
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,51200,256,0.030264000097910564
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,51200,64,0.0035377778112888336
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,51200,128,0.024925332930352952
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,51200,32,0.003546666767862108
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,51200,64,0.014107555150985718
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,51200,32,0.014834667245546976
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,16384,65536,0.32238488727145725
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,51200,2048,0.062018666002485484
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,16384,65536,0.18853955798678926
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,51200,51200,0.7005288865831164
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,51200,768,0.037478221787346735
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,16384,51200,0.2529208925035265
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,16384,51200,0.14253689183129206
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,16384,16384,0.09122666385438706
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,16384,12288,0.07147555881076388
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,51200,128,0.012430222498046027
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,16384,16384,0.057032002343071826
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,51200,65536,0.9048293431599935
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,16384,12288,0.04506399896409777
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,16384,10240,0.05344177616967095
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,16384,16384,0.07112533516354032
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,16384,8192,0.04441155658827888
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,16384,12288,0.05901600254906548
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,16384,7168,0.03895377781656053
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,16384,8192,0.03644444545110067
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,16384,10240,0.05375111103057861
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,16384,8192,0.04886044396294487
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,16384,6144,0.03331644336382548
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,16384,7168,0.03760977917247348
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,16384,5120,0.029114666912290785
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,16384,6144,0.03623111049334208
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,16384,7168,0.045759999089770846
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,16384,4096,0.024724443753560383
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,16384,6144,0.045399109522501625
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,16384,5120,0.03126577867401971
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,16384,5120,0.040440890524122454
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,16384,3584,0.021518222159809534
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,16384,51200,0.157078226407369
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,16384,4096,0.03811555438571506
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,16384,3072,0.018917333748605516
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,16384,3584,0.025472889343897503
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,16384,3584,0.034733331865734525
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,16384,4096,0.02679555614789327
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,16384,65536,0.20070577992333305
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,16384,2560,0.01609688831700219
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,16384,2048,0.013099555340078143
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,16384,3072,0.03304533494843377
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,16384,2560,0.020290666156344943
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,16384,3072,0.02330488959948222
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,16384,1536,0.01036711119943195
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,16384,2048,0.029727111260096233
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,16384,1024,0.008720888859695857
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,16384,2048,0.019350222415394254
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,16384,768,0.007121777368916406
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,16384,10240,0.042457779248555504
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,16384,1536,0.02784622377819485
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,16384,1536,0.01779111060831282
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,16384,512,0.005607111172543631
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,16384,1024,0.025115556187099878
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,16384,1024,0.014763555592960782
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,16384,256,0.0032115555885765287
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,16384,768,0.013749333719412485
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,16384,768,0.023095111052195232
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,16384,512,0.021720889541837905
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,16384,128,0.003173333282272021
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,16384,512,0.012456888953844706
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,16384,256,0.019904888338512845
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,16384,256,0.011416888899273343
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,16384,32,0.0031911111954185697
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,16384,128,0.019211555520693462
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,16384,128,0.012055111428101858
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,16384,64,0.011086222198274402
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,16384,32,0.012103999654452005
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,12288,65536,0.25226932101779515
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,12288,65536,0.157279994752672
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,12288,51200,0.19970488548278809
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,12288,51200,0.12433689170413548
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,12288,16384,0.06742933061387804
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,12288,12288,0.05243822269969516
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,12288,16384,0.05009955498907301
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,16384,2560,0.03120622369978163
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,12288,12288,0.040488001373079084
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,12288,16384,0.06124533547295464
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,12288,12288,0.052448001172807485
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,12288,10240,0.036271999279658
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,12288,8192,0.03792000148031447
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,16384,64,0.002797333316670524
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,12288,10240,0.04769600099987454
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,12288,7168,0.033259554041756526
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,12288,8192,0.032999111546410456
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,12288,8192,0.04350044329961141
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,12288,7168,0.0344124436378479
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,12288,6144,0.02908888790342543
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,12288,7168,0.04335022303793165
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,12288,65536,0.16678755813174775
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,12288,5120,0.025721778472264607
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,12288,6144,0.031672000885009766
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,12288,51200,0.13209244940016004
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,12288,4096,0.022608000371191237
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,12288,6144,0.03981599873966641
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,12288,3584,0.020000000794728596
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,12288,5120,0.0368115570810106
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,12288,5120,0.027611555324660406
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,12288,4096,0.024889777104059856
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,12288,3072,0.01776444415251414
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,12288,4096,0.03388533327314589
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,12288,2560,0.012420444852775998
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,12288,3584,0.03296622302797105
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,12288,3584,0.022664889693260193
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,12288,3072,0.021320000290870667
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,12288,10240,0.04463288850254483
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,12288,3072,0.032234665420320295
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,12288,2560,0.03086400032043457
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,12288,1536,0.009164444274372524
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,12288,2048,0.028429332706663344
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,12288,2048,0.01813066667980618
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,12288,1024,0.007968000239796108
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,12288,1536,0.016537777251667447
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,12288,768,0.006739555547634761
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,12288,1024,0.023538667294714186
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,12288,1536,0.0280675556924608
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,12288,512,0.00452888881166776
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,12288,768,0.013743999931547375
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,12288,768,0.022114665971861944
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,12288,256,0.003843555433882607
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,12288,512,0.01275466630856196
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,12288,512,0.021632888250880774
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,12288,128,0.0032248888164758682
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,12288,256,0.011415111521879831
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,12288,256,0.021287999219364587
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,12288,64,0.0028533333291610083
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,12288,128,0.018223999275101554
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,12288,128,0.011728000309732227
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,12288,32,0.0032106666929192017
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,12288,64,0.01202755586968528
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,12288,32,0.01240888900227017
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,12288,2048,0.010663111176755695
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,12288,2560,0.01961599952644772
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,10240,65536,0.1552168925603231
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,10240,51200,0.174291557735867
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,10240,16384,0.0605493320359124
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,10240,51200,0.11882844236161973
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,12288,1024,0.013463111387358772
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,10240,12288,0.0469706654548645
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,10240,16384,0.048375109831492104
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,10240,12288,0.03917155663172404
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,10240,10240,0.038896001047558255
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,10240,16384,0.05790577994452583
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,10240,12288,0.05073422193527222
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,10240,10240,0.03491555651028951
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,10240,8192,0.03256622287962172
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,10240,10240,0.04572977622350057
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,10240,7168,0.029294222593307495
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,10240,8192,0.031339555978775024
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,10240,65536,0.15417510933346218
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,10240,65536,0.21863110860188803
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,10240,6144,0.02632444434695774
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,10240,8192,0.0414284434583452
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,10240,5120,0.02295733326011234
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,10240,7168,0.029492444462246362
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,10240,7168,0.04103911254141066
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,10240,6144,0.028033776415718928
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,10240,5120,0.024009777439965144
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,10240,4096,0.01978488928741879
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,10240,6144,0.03828710979885525
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,10240,5120,0.03509689039654202
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,10240,3584,0.017454221844673157
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,10240,3072,0.015726221932305228
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,10240,4096,0.022478222846984863
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,10240,4096,0.034295111894607544
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,10240,3584,0.03178044491344028
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,10240,2560,0.012358222570684222
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,10240,3072,0.019273777802785236
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,10240,3072,0.030819555123647053
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,10240,2560,0.018935999936527677
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,10240,2560,0.029790222644805908
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,10240,1536,0.009226666556464301
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,10240,2048,0.02769333289729224
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,10240,2048,0.01700177788734436
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,10240,1024,0.007232888705200619
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,10240,1536,0.02696177860101064
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,10240,1536,0.016020443704393175
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,10240,768,0.00554044461912579
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,10240,1024,0.013079110946920184
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,10240,1024,0.022288888692855835
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,10240,512,0.0047324444684717385
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,10240,768,0.012783110969596438
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,10240,768,0.02217866645918952
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,10240,256,0.003843555433882607
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,10240,512,0.020253333780500624
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,10240,512,0.012112889024946423
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,10240,128,0.0035208890007601846
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,10240,51200,0.12512621614668104
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,10240,256,0.011373333632946014
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,10240,256,0.019554666346973844
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,10240,64,0.0028151110228565005
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,10240,32,0.0029804443733559716
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,10240,128,0.011039111349317761
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,10240,128,0.019208000765906442
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,10240,64,0.010794666906197866
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,10240,32,0.011711111499203576
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,8192,65536,0.17469688256581625
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,10240,3584,0.021134222547213238
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,8192,65536,0.10347021950615777
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,8192,51200,0.08050133122338189
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,8192,16384,0.04582488867971632
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,8192,12288,0.032912890116373696
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,8192,16384,0.0366248885790507
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,8192,12288,0.030248890320460003
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,8192,16384,0.057583113511403404
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,8192,10240,0.027726221415731642
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,8192,12288,0.0494026674164666
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,8192,10240,0.027441778116756018
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,8192,8192,0.023749333288934495
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,8192,10240,0.045666668150160045
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,8192,65536,0.15080089039272732
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,8192,7168,0.020544000797801547
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,8192,51200,0.12345155080159505
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,8192,8192,0.02380888826317257
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,8192,6144,0.018177777528762817
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,8192,8192,0.04207466708289253
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,8192,5120,0.015965332587560017
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,8192,7168,0.03933155536651611
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,8192,6144,0.02267644471592373
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,8192,6144,0.03673422336578369
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,8192,4096,0.013566222455766467
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,8192,5120,0.03499822152985467
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,8192,51200,0.13207377327813044
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,8192,5120,0.020621332857343886
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,8192,3584,0.011740444435013665
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,10240,2048,0.010536889235178629
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,8192,4096,0.019336889187494915
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,8192,3072,0.010982222027248807
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,8192,2560,0.009639110830095079
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,8192,3584,0.03137422270245022
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,8192,3072,0.03012266755104065
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,8192,3072,0.017879999346203275
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,8192,2048,0.008610666626029545
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,8192,2560,0.016719111137919955
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,8192,2560,0.029214223225911457
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,8192,1536,0.007589333587222629
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,8192,2048,0.02825511164135403
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,8192,2048,0.015822221835454304
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,8192,1024,0.005410666680998272
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,8192,1536,0.02415200074513753
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,8192,1536,0.013811555173661975
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,8192,768,0.004562666846646203
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,8192,1024,0.013092444174819522
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,8192,1024,0.02207022243075901
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,8192,512,0.003867555409669876
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,8192,768,0.021312889125612047
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,8192,768,0.012120000190205045
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,8192,256,0.0031617778456873367
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,8192,512,0.012059555285506778
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,8192,512,0.021662222014533147
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,8192,128,0.0031715554909573663
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,8192,256,0.011400889191362592
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,8192,256,0.020248000820477802
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,8192,64,0.0026275554878844153
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,8192,128,0.01886666648917728
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,8192,128,0.011386666860845355
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,8192,32,0.002833777831660377
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,8192,64,0.011029333704047732
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,8192,32,0.011759999725553723
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,7168,65536,0.14962311585744223
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,8192,4096,0.03348088926739163
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,7168,51200,0.11844355530209011
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,8192,3584,0.01851111153761546
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,7168,16384,0.04217244519127739
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,7168,51200,0.07445600297715929
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,7168,12288,0.03356800145573086
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,7168,16384,0.034663110971450806
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,7168,12288,0.028798222541809082
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,7168,16384,0.056411557727389865
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,7168,10240,0.028322666883468628
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,7168,12288,0.04856444398562113
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,7168,8192,0.02194044490655263
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,7168,10240,0.025231111380789015
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,7168,10240,0.046329776446024575
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,7168,51200,0.12307111422220866
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,7168,65536,0.1517688830693563
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,7168,7168,0.01900800069173177
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,7168,6144,0.01676977839734819
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,7168,8192,0.022673777408070032
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,7168,8192,0.04026755690574646
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,8192,7168,0.02467022173934513
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,7168,7168,0.039055999782350324
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,7168,5120,0.014527110589875115
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,7168,7168,0.02399377855989668
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,7168,6144,0.03638044330808852
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,7168,6144,0.022014222211307947
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,7168,4096,0.012706666356987424
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,7168,5120,0.03439377744992574
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,7168,3584,0.011042666931947073
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,7168,5120,0.020294222566816542
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,7168,65536,0.09512888722949558
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,7168,4096,0.033913777934180364
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,7168,3072,0.009957333405812582
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,7168,2560,0.008940444224410588
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,7168,3584,0.032572444942262434
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,7168,3584,0.018227555685573153
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,7168,3072,0.031178666485680476
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,7168,3072,0.01717688971095615
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,7168,2048,0.0076453329788313965
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,7168,1536,0.007242666350470648
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,7168,2560,0.015995555453830294
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,7168,2048,0.025742222865422566
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,7168,2048,0.01516533394654592
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,7168,1024,0.004938666605287128
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,7168,1536,0.024335111180941265
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,7168,1536,0.013482666677898832
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,7168,768,0.004200889004601372
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,7168,1024,0.013095999757448832
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,7168,1024,0.021617778473430212
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,7168,512,0.0035128887328836652
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,7168,768,0.011867555479208628
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,7168,256,0.0031635556370019913
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,7168,512,0.011700444751315646
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,7168,512,0.02162488963868883
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,7168,128,0.002833777831660377
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,7168,256,0.011029333704047732
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,7168,256,0.01963644391960568
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,7168,64,0.0030088888274298776
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,7168,128,0.011413333316644033
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,7168,128,0.018523555662896898
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,7168,32,0.0027271111806233725
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,7168,64,0.011028444601429833
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,6144,65536,0.1239946683247884
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,7168,32,0.011372444530328115
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,7168,4096,0.01887822151184082
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,6144,51200,0.09746844238705105
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,6144,65536,0.08865777651468913
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,6144,16384,0.035918222533331975
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,7168,2560,0.029735998974906072
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,6144,16384,0.032524443335003324
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,6144,12288,0.02888622217708164
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,6144,16384,0.057118223773108594
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,7168,768,0.020974222156736586
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,6144,10240,0.02500444485081567
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,6144,12288,0.026518222358491685
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,6144,12288,0.04976355698373583
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,6144,65536,0.15115555127461752
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,6144,51200,0.1229119963116116
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,6144,8192,0.021291555629836187
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,6144,10240,0.023927999867333308
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,6144,7168,0.019388443893856473
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,6144,10240,0.04481866624620226
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,6144,8192,0.021894221504529316
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,6144,8192,0.040136890278922185
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,6144,7168,0.03949688871701559
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,6144,5120,0.015065777632925244
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,6144,6144,0.036271111832724676
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,6144,6144,0.0214044451713562
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,6144,4096,0.011855999628702799
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,6144,5120,0.020264888803164165
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,6144,5120,0.03456177645259433
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,6144,3584,0.010606221854686737
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,6144,51200,0.06816711028416951
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,6144,4096,0.018538667096032035
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,6144,4096,0.03303466571701898
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,6144,3072,0.009477333062224919
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,6144,3584,0.017671111557218764
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,6144,3584,0.030787554052140977
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,6144,3072,0.030841777722040813
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,6144,2560,0.008386666576067606
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,6144,2048,0.007259555160999298
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,6144,2560,0.015786666009161208
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,6144,2560,0.029665778080622356
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,6144,1536,0.006601777755551868
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,6144,2048,0.01427111029624939
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,6144,2048,0.025268443756633337
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,6144,1024,0.00519822206762102
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,6144,1536,0.023677332533730402
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,6144,1536,0.013780444032616086
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,6144,768,0.00453244439429707
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,6144,1024,0.01239911135700014
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,6144,1024,0.021944888763957556
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,6144,512,0.003556444413132138
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,6144,6144,0.017496888836224873
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,6144,768,0.012455999851226807
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,6144,7168,0.022436444958051045
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,6144,256,0.0032435556252797446
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,6144,128,0.0028533333291610083
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,6144,512,0.011769777370823754
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,6144,512,0.01994755533006456
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,6144,64,0.0028115556471877625
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,6144,256,0.019567999574873183
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,6144,256,0.011787555283970304
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,6144,32,0.0028275555620590844
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,6144,128,0.01146133326821857
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,6144,128,0.018604444132910836
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,6144,64,0.010684444672531553
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,5120,65536,0.10803733269373576
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,6144,32,0.011031111081441244
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,5120,65536,0.07968978087107341
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,5120,51200,0.08605777555041844
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,6144,3072,0.016939555605252583
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,5120,16384,0.03247022297647264
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,5120,51200,0.06254666381412081
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,5120,12288,0.026326222552193537
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,5120,16384,0.030213332838482324
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,5120,12288,0.02348444362481435
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,5120,16384,0.05683200226889717
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,5120,10240,0.022616000639067754
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,5120,12288,0.048828442891438804
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,5120,65536,0.15011289384629992
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,5120,10240,0.022311111291249592
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,5120,51200,0.12313244077894424
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,5120,10240,0.043559110826916166
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,5120,7168,0.01754755609565311
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,6144,768,0.020676443974177044
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,5120,8192,0.04109866751564874
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,5120,8192,0.020631111330456205
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,5120,6144,0.016069332758585613
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,5120,7168,0.021939555803934734
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,5120,5120,0.014092443717850579
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,5120,7168,0.03845422135459052
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,5120,4096,0.011034666664070554
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,5120,6144,0.03602844476699829
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,5120,6144,0.02055111030737559
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,5120,5120,0.033803555700514056
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,5120,3584,0.009658666948477427
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,5120,5120,0.018921777606010437
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,5120,3072,0.008784888519181145
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,5120,4096,0.03257688879966736
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,5120,3584,0.01702666613790724
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,5120,3584,0.03141333328353034
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,5120,2560,0.007937777373525832
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,5120,3072,0.029108444849650066
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,5120,3072,0.01551822159025404
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,5120,2048,0.006774222271309958
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,5120,2560,0.015190222197108798
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,5120,2560,0.02812622321976556
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,5120,1536,0.00590844452381134
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,5120,2048,0.013806222213639153
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,5120,2048,0.024680889315075342
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,5120,1024,0.004407111141416761
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,5120,1536,0.02402666707833608
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,5120,1536,0.013409777647919126
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,5120,768,0.003935111065705617
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,5120,1024,0.021640888518757288
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,5120,1024,0.0120666664507654
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,5120,512,0.003552000141806073
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,5120,768,0.01205244412024816
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,5120,768,0.02174577779240078
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,5120,8192,0.019711110326978896
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,5120,256,0.0031662223239739737
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,5120,512,0.020238222347365487
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,5120,128,0.0028773333049482773
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,5120,256,0.011794666449228922
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,5120,128,0.017895110779338412
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,5120,128,0.0103502223889033
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,5120,32,0.0028808888875775864
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,5120,64,0.01071466671095954
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,5120,32,0.011019555230935415
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,4096,65536,0.08630488978491889
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,5120,4096,0.017779555585649278
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,4096,51200,0.06825955708821614
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,4096,65536,0.0732426643371582
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,4096,51200,0.05840444564819336
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,4096,16384,0.026375111606385972
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,4096,65536,0.14959200223286948
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,4096,16384,0.026172444224357605
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,4096,12288,0.020940444535679285
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,4096,51200,0.12199555502997504
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,5120,512,0.011366222467687396
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,4096,16384,0.0563946697447035
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,5120,256,0.02095288866096073
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,4096,12288,0.022336888644430373
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,4096,12288,0.04805066519313388
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,5120,64,0.0025048889219760895
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,4096,8192,0.015832889411184523
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,4096,10240,0.0207324441936281
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,4096,7168,0.014399111270904541
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,4096,10240,0.044066667556762695
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,4096,8192,0.04080533319049411
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,4096,8192,0.01965688831276364
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,4096,6144,0.013112000293201871
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,4096,5120,0.011869333684444427
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,4096,7168,0.038273778226640486
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,4096,7168,0.02033511135313246
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,4096,6144,0.035437332259284124
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,4096,6144,0.019919999771647982
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,4096,4096,0.012744888663291931
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,4096,3584,0.01166488892502255
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,4096,5120,0.018176888426144917
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,4096,5120,0.033923556407292686
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,4096,4096,0.017055999901559617
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,4096,4096,0.033088889386918806
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,4096,3072,0.010334221853150262
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,4096,3584,0.031846221950319074
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,4096,3584,0.015857777661747403
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,4096,2560,0.007241778075695038
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,4096,3072,0.015599111715952555
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,4096,2560,0.014124444789356656
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,4096,2048,0.006506666541099548
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,4096,2048,0.025516443782382544
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,4096,2048,0.013454222016864352
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,4096,1536,0.004879111217127906
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,4096,1536,0.013070222404268054
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,4096,10240,0.018413333429230582
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,4096,1024,0.003887999802827835
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,4096,1024,0.02165066699186961
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,4096,768,0.0037706668178240457
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,4096,768,0.011729777687125735
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,4096,768,0.02091377807988061
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,4096,512,0.003499555504984326
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,4096,512,0.020046222541067336
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,4096,512,0.011527111132939657
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,4096,256,0.0028657778683635923
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,4096,256,0.01925511161486308
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,4096,256,0.01072088877360026
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,4096,128,0.00286311118139161
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,4096,2560,0.027056000298923914
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,4096,64,0.002577777744995223
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,4096,128,0.010683555569913654
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,4096,128,0.017881777551439073
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,4096,32,0.002581333327624533
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,4096,64,0.011072888970375061
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,3584,65536,0.0790791114171346
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,4096,32,0.011030221978823343
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,4096,1536,0.02367555598417918
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,3584,51200,0.06087377998563978
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,3584,65536,0.06986488898595174
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,4096,1024,0.012083555261294046
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,3584,16384,0.024192000428835552
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,3584,51200,0.0566542214817471
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,3584,12288,0.019298666053348117
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,3584,16384,0.025462221768167283
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,3584,16384,0.056186669402652316
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,3584,12288,0.022172444396548804
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,3584,65536,0.14976621998680964
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,3584,10240,0.016754666964213055
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,3584,8192,0.014762666490342883
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,3584,12288,0.047092444366878934
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,3584,10240,0.020475554797384474
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,3584,7168,0.013658666776286231
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,3584,8192,0.04008000095685323
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,3584,8192,0.019268444842762418
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,4096,3072,0.029465778006447688
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,3584,6144,0.012646222280131446
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,3584,7168,0.020562666985723708
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,3584,7168,0.03758488761054145
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,3584,5120,0.011754666765530905
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,3584,6144,0.019109333554903667
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,3584,4096,0.012400888734393649
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,3584,5120,0.03360088997417026
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,3584,4096,0.01625777781009674
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,3584,3584,0.010334221853150262
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,3584,4096,0.03289066751797994
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,3584,3072,0.010293333066834344
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,3584,3584,0.028594666057162817
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,3584,3584,0.014920888675583733
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,3584,2560,0.00832711077398724
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,3584,3072,0.0148026661740409
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,3584,3072,0.02741066614786784
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,3584,2048,0.005591111050711737
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,3584,2560,0.02720888952414195
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,3584,2560,0.013809777796268463
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,3584,1536,0.004515555583768421
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,3584,51200,0.1218951145807902
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,3584,2048,0.02516799999607934
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,3584,2048,0.013069333301650153
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,3584,1024,0.00388355553150177
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,3584,1536,0.012740444805887012
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,3584,768,0.0038311113086011675
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,3584,1536,0.022991999983787537
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,3584,10240,0.043430222405327686
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,3584,1024,0.012055111428101858
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,3584,1024,0.022357333037588332
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,3584,512,0.00351200004418691
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,3584,256,0.003167111012670729
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,3584,768,0.020609777834680345
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,3584,768,0.011728000309732227
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,3584,512,0.02163022259871165
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,3584,128,0.0028320000403457214
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,3584,512,0.011694221860832639
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,3584,64,0.002756444530354606
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,3584,256,0.01921244462331136
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,3584,32,0.002801777794957161
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,3584,6144,0.03630933496687148
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,3584,128,0.010384889112578498
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,3584,5120,0.018422222799725003
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,3072,65536,0.06368177466922335
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,3584,32,0.011057777537239922
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,3072,51200,0.05104533169004652
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,3072,65536,0.06835555367999606
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,3072,16384,0.02060622142420875
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,3072,51200,0.05452266666624281
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,3072,16384,0.024922667278183833
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,3072,65536,0.15064356062147352
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,3072,51200,0.12253688441382514
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,3072,12288,0.017500445246696472
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,3072,16384,0.05498577819930183
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,3072,10240,0.01533600025706821
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,3072,12288,0.04801155461205376
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,3072,12288,0.02164177762137519
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,3072,8192,0.01329422245422999
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,3072,10240,0.019996444384257
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,3072,10240,0.044529779089821704
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,3072,7168,0.012379555238617791
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,3072,8192,0.018915555543369718
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,3584,256,0.01075644459989336
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,3072,8192,0.03978666663169861
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,3584,128,0.019308444526460435
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,3072,7168,0.018862222631772358
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,3584,64,0.01073066641887029
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,3072,7168,0.03882844580544366
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,3072,5120,0.010563555690977307
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,3072,6144,0.01829155617290073
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,3072,6144,0.03719288773006863
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,3072,4096,0.009759999811649323
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,3072,3584,0.009939555492666032
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,3072,5120,0.03329866793420579
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,3072,5120,0.01683111157682207
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,3072,4096,0.030995554394192163
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,3072,4096,0.01549600064754486
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,3072,3584,0.014448000325096978
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,3072,3584,0.029512001408471003
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,3072,2560,0.006632888896597757
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,3072,3072,0.027429333991474573
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,3072,3072,0.014135999812020196
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,3072,2048,0.005593777944644292
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,3072,2560,0.026787555880016748
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,3072,2560,0.013579555683665805
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,3072,1536,0.004549333204825719
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,3072,2048,0.024097777075237695
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,3072,2048,0.01332800007528729
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,3072,1024,0.0038728887836138406
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,3072,1536,0.02370044423474206
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,3072,768,0.003593777616818746
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,3072,1024,0.02125066684352027
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,3072,1024,0.012533333566453723
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,3072,512,0.003212444484233856
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,3072,768,0.020624889267815482
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,3072,768,0.01202755586968528
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,3072,256,0.0031644445326593188
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,3072,512,0.012065778175989786
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,3072,512,0.019897777173254225
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,3072,128,0.0028151110228565005
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,3072,6144,0.011927111281288994
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,3072,256,0.011710222396585675
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,3072,256,0.020981333321995203
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,3072,64,0.0028080000645584534
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,3072,32,0.0028133332315418455
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,3072,128,0.018583999739752877
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,3072,128,0.010687111152542962
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,3072,64,0.011597333682907952
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,2560,65536,0.057769775390625
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,3072,32,0.011362666885058085
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,2560,51200,0.045700444115532764
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,2560,65536,0.06530488861931695
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,2560,16384,0.01945955554644267
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,2560,51200,0.053139554129706494
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,2560,16384,0.024205333656734888
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,2560,65536,0.1505368947982788
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,2560,16384,0.05546311206287808
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,2560,12288,0.01573333309756385
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,2560,51200,0.12176799774169922
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,2560,10240,0.013776889277829064
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,3072,1536,0.012436444560686747
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,2560,8192,0.012483555409643384
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,2560,12288,0.04793688986036512
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,2560,10240,0.01959022217326694
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,2560,10240,0.04371644390953911
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,2560,7168,0.011351111034552256
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,2560,8192,0.018696889281272888
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,2560,8192,0.04038844505945841
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,2560,6144,0.010536889235178629
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,2560,7168,0.01816444430086348
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,2560,7168,0.03820533222622342
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,2560,5120,0.009964444571071202
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,2560,6144,0.01717333330048455
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,2560,6144,0.03638222151332431
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,2560,5120,0.015624889069133334
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,2560,5120,0.03313688768280877
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,2560,3584,0.009297777381208207
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,2560,4096,0.030171556605233088
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,2560,4096,0.014119999276267158
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,2560,3072,0.008271111382378472
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,2560,3584,0.013802666631009845
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,2560,3584,0.028492444091373022
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,2560,2560,0.006254222244024277
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,3072,3072,0.008608889248636033
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,2560,2048,0.005224888937340842
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,2560,3072,0.02796799937884013
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,2560,2560,0.027102222045262653
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,2560,2560,0.013100444442696042
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,2560,1536,0.004545777622196409
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,2560,2048,0.025384000606007043
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,2560,2048,0.012748444245921241
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,2560,1024,0.003843555433882607
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,2560,1536,0.012430222498046027
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,2560,1536,0.02437422176202138
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,2560,768,0.00361333332127995
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,2560,1024,0.012059555285506778
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,2560,1024,0.021288888321982488
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,2560,512,0.0035297779573334586
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,2560,768,0.012086222569147745
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,2560,768,0.020569778150982328
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,2560,256,0.0031582222630580268
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,2560,512,0.011397333608733283
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,2560,512,0.020954666866196528
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,2560,128,0.002570666579736604
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,2560,256,0.011031111081441244
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,2560,256,0.01954844428433312
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,2560,64,0.002519999941190084
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,2560,4096,0.009380444056457942
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,2560,128,0.018034666776657104
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,2560,32,0.0028391112056043413
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,2560,64,0.010440000229411654
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,2048,65536,0.05159644285837809
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,2560,32,0.010681777364677854
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,2048,51200,0.037328001525666975
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,2560,3072,0.013266666895813413
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,2048,16384,0.016136000553766888
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,2048,51200,0.05122577812936571
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,2048,65536,0.15012089411417642
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,2048,16384,0.02375999920898014
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,2048,12288,0.01313244468635983
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,2048,51200,0.12194932831658258
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,2048,16384,0.05509333478079902
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,2560,12288,0.021291555629836187
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,2048,10240,0.01938311093383365
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,2048,10240,0.044511109590530396
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,2048,8192,0.010398222340477837
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,2048,8192,0.040082666609022356
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,2048,8192,0.01816177699300978
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,2048,7168,0.010601777997281818
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,2560,128,0.0110880004035102
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,2048,6144,0.012476444244384766
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,2048,7168,0.017516444126764934
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,2048,7168,0.03644799855020311
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,2048,5120,0.011804444094498953
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,2048,6144,0.015792000624868605
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,2048,6144,0.03642755415704515
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,2048,65536,0.06247022416856554
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,2048,5120,0.015184000134468079
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,2048,5120,0.032701333363850914
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,2048,3584,0.009195555415418413
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,2048,4096,0.014128888646761576
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,2048,4096,0.03014666504330105
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,2048,3072,0.006568000134494569
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,2048,3584,0.013991110854678683
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,2048,3584,0.028508444627126057
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,2048,2560,0.005933333188295364
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,2048,10240,0.01180622229973475
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,2048,3072,0.013407111167907715
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,2048,3072,0.02751111156410641
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,2048,12288,0.020862221717834473
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,2048,2048,0.005208888815508948
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,2048,1536,0.004527111020353106
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,2048,2560,0.025690666503376428
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,2048,2048,0.0240328891409768
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,2048,2048,0.01276533305644989
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,2048,1024,0.003887999802827835
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,2048,1536,0.012334222594896952
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,2048,768,0.0035146665241983202
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,2048,1024,0.01203733351495531
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,2048,768,0.011371555427710215
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,2048,768,0.021651556094487507
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,2048,512,0.0035235554807715942
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,2048,512,0.020584000481499564
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,2048,512,0.011751111182901593
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,2048,256,0.00282222218811512
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,2048,4096,0.010291555689440833
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,2048,128,0.0028533333291610083
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,2048,256,0.019909333851602342
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,2048,256,0.011429333024554782
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,2048,64,0.0028044444819291434
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,2048,128,0.011547555526097616
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,2048,128,0.01830844415558709
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,2048,32,0.002505777817633417
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,2048,64,0.01108977778090371
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,1536,65536,0.03664088911480374
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,2048,32,0.011039111349317761
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,2048,12288,0.04767555660671658
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,1536,51200,0.029056890143288508
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,2048,2560,0.01311644415060679
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,1536,65536,0.06083199712965223
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,1536,16384,0.013185777597957186
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,1536,51200,0.049759109814961754
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,2048,1536,0.0229795558585061
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,1536,65536,0.15036888917287192
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,1536,12288,0.011553777588738335
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,1536,16384,0.02343822187847561
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,1536,16384,0.05494488941298591
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,1536,51200,0.1221662229961819
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,2048,1024,0.021312889125612047
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,1536,10240,0.01072533345884747
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,1536,8192,0.009441778063774109
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,1536,12288,0.04749777913093567
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,1536,12288,0.020586666133668687
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,1536,10240,0.0433573325475057
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,1536,10240,0.018763555420769584
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,1536,6144,0.008884444832801819
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,1536,8192,0.016935111747847665
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,1536,8192,0.039566222164365984
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,1536,7168,0.016352888610627916
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,1536,7168,0.036088890499538846
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,1536,5120,0.007992000215583378
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,1536,4096,0.006966222491529252
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,1536,6144,0.03458222084575229
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,1536,6144,0.01551466683546702
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,1536,3584,0.007264888948864407
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,1536,5120,0.015145777000321282
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,1536,4096,0.014107555150985718
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,1536,4096,0.030533333619435627
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,1536,3072,0.006615110983451207
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,1536,3584,0.028809779220157202
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,1536,3584,0.013928888572586907
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,1536,2560,0.005912888795137405
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,1536,3072,0.027112000518374976
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,1536,3072,0.013413333230548434
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,1536,2048,0.0058666666348775225
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,1536,2560,0.02685955497953627
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,1536,2560,0.01310222182008955
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,1536,1536,0.004271111140648524
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,1536,2048,0.013057777451144325
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,1536,1024,0.0038524443904558816
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,1536,1536,0.01237511138121287
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,1536,1536,0.023912888434198167
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,1536,768,0.003540444291300244
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,1536,1024,0.01239999963177575
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,1536,1024,0.02239822182390425
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,1536,512,0.003154666680428717
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,1536,768,0.012107555237081317
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,1536,768,0.02162488963868883
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,1536,256,0.0028764444092909494
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,1536,7168,0.009661333428488838
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,1536,512,0.011744000017642975
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,1536,512,0.021498666869269475
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,1536,128,0.0028008888992998335
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,1536,256,0.01919911139541202
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,1536,256,0.011711999773979187
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,1536,64,0.0026382222357723448
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,1536,128,0.011431111229790581
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,1536,32,0.00254488881263468
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,1536,5120,0.031153778235117596
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,1024,65536,0.026144888665941026
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,1536,64,0.011376000112957425
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,1536,32,0.011767110890812345
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,1024,51200,0.021900445222854614
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,1024,65536,0.05812355544832018
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,1024,16384,0.01497333414024777
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,1024,51200,0.046875556310017906
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,1024,65536,0.14907199806637234
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,1024,51200,0.12201955583360459
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,1024,16384,0.054879112376107105
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,1024,16384,0.022319111559126113
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,1024,10240,0.011384888655609555
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,1024,12288,0.019055111540688407
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,1024,12288,0.046579556332694165
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,1024,8192,0.010447999669445885
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,1024,10240,0.017856000198258292
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,1024,10240,0.04309422108862135
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,1024,7168,0.010039110978444418
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,1024,8192,0.03804088963402642
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,1024,8192,0.016721778445773654
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,1024,6144,0.009006222089131674
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,1024,7168,0.015930665863884818
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,1024,7168,0.03528711199760437
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,1024,5120,0.008271111382378472
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,1024,6144,0.034627556800842285
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,1024,6144,0.01553600033124288
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,1536,128,0.0192577772670322
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,1024,4096,0.007669332954618666
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,1024,3584,0.007271111011505127
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,1024,5120,0.03086400032043457
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,1024,5120,0.014473777678277759
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,1024,4096,0.029847111966874864
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,1024,3072,0.00656355544924736
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,1024,3584,0.027838223510318335
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,1024,3584,0.013767999907334646
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,1024,2560,0.0058755555914507965
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,1024,3072,0.02677333354949951
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,1024,2048,0.006636444479227066
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,1024,2560,0.01313244468635983
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,1024,12288,0.012717333104875354
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,1024,1536,0.005557333429654439
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,1536,2048,0.02426311042573717
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,1024,2048,0.012489777472284106
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,1024,2048,0.025021332833502028
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,1024,1024,0.004866666677925321
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,1024,1536,0.012071111136012606
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,1024,1536,0.02269511090384589
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,1024,768,0.004209777961174647
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,1024,1024,0.021645334031846788
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,1024,1024,0.012387555506494312
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,1024,512,0.0035439998739295532
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,1024,768,0.020980444219377305
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,1024,512,0.011756444142924415
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,1024,512,0.019898666275872123
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,1024,256,0.011050666371981302
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,1024,4096,0.014119999276267158
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,1024,256,0.01937333411640591
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,1024,128,0.0030826667530669104
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,1024,3072,0.013444444371594323
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,1024,128,0.019469334019554984
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,1024,128,0.01034400032626258
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,1024,64,0.002826666666401757
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,1024,32,0.0028320000403457214
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,1024,2560,0.025901334153281316
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,768,65536,0.0214035560687383
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,1024,64,0.011527111132939657
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,1024,32,0.011696889168686338
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,768,51200,0.018437332577175565
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,768,65536,0.05652444230185615
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,768,16384,0.01055555542310079
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,768,65536,0.1490266720453898
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,768,51200,0.04638311266899109
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,768,12288,0.01110400011142095
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,768,16384,0.02160088883505927
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,1024,768,0.011720889144473605
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,768,10240,0.009988444546858469
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,768,12288,0.01888444523016612
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,768,12288,0.04554933309555054
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,768,8192,0.009359999663299983
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,768,10240,0.04208533300293816
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,768,10240,0.017567111386193168
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,768,7168,0.008636444807052612
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,768,8192,0.037463999456829496
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,768,8192,0.016524444023768108
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,768,6144,0.008287111090289222
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,768,7168,0.015844444433848064
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,768,5120,0.007365333537260692
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,768,6144,0.01516711049609714
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,768,6144,0.03405155407057868
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,768,4096,0.007292444507280986
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,768,5120,0.014545778433481852
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,768,4096,0.013815110756291283
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,768,3584,0.0069822221994400024
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,768,4096,0.02944444285498725
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,768,3584,0.013793778088357715
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,768,3072,0.006790222393141852
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,768,51200,0.12185955047607422
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,768,3072,0.01347644461525811
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,768,16384,0.05283111002710131
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,768,2560,0.006604444649484422
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,768,3072,0.028106666273540918
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,768,2048,0.005244444641802046
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,1024,256,0.0032053333189752367
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,768,2560,0.026392888691690233
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,768,2560,0.012805333567990197
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,768,1536,0.005044444567627377
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,768,2048,0.012805333567990197
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,768,2048,0.024726221958796184
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,768,1024,0.0042239998777707415
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,768,1536,0.02450399928622776
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,768,1536,0.012063110868136087
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,768,768,0.0035297779573334586
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,768,7168,0.03499644332461887
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,768,512,0.0035333335399627686
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,768,1024,0.022662222385406494
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,768,1024,0.012409778104888068
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,768,256,0.003170666595300039
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,768,512,0.02128533356719547
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,768,5120,0.031144890520307753
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,768,512,0.011376000112957425
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,768,128,0.00282222218811512
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,768,256,0.011540444360838996
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,768,64,0.002536000063021978
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,768,256,0.020953777763578627
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,768,128,0.010684444672531553
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,768,32,0.0028328889360030494
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,512,65536,0.017468444175190397
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,768,64,0.011152000062995486
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,768,32,0.011081777513027191
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,512,51200,0.014698666003015308
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,512,65536,0.05542400148179796
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,512,65536,0.14904088444179958
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,512,16384,0.011057777537239922
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,512,51200,0.045570668247010976
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,512,51200,0.12152177757687038
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,512,12288,0.008676444490750631
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,512,16384,0.05359022153748406
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,512,12288,0.019241778386963736
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,512,12288,0.04534488916397095
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,512,10240,0.00832622249921163
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,768,768,0.011414222419261932
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,512,10240,0.042169776227739125
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,512,10240,0.017512000269360013
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,512,8192,0.008286221987671321
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,512,7168,0.00795111142926746
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,512,8192,0.03698044353061252
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,512,8192,0.016519111063745286
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,512,6144,0.007607111500369177
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,768,128,0.017893332574102614
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,512,7168,0.015806222955385845
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,512,7168,0.03530577818552653
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,512,5120,0.006960888703664144
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,512,6144,0.03297422329584757
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,768,3584,0.028307557106018066
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,512,4096,0.007258666886223688
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,512,5120,0.031178666485680476
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,512,5120,0.014494222071435718
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,512,3584,0.006911110960774952
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,512,4096,0.01369066701995002
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,512,3072,0.006527110934257507
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,512,3584,0.013174222575293647
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,512,3584,0.027803556786643133
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,512,2560,0.006511111226346757
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,512,3072,0.013068444199032254
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,512,3072,0.02676800058947669
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,512,2048,0.005954666684071223
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,512,16384,0.02155911094612545
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,512,2560,0.012758221891191272
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,512,2560,0.02569155560599433
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,512,1536,0.00452622233165635
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,512,2048,0.024679111109839544
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,512,2048,0.0123857781291008
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,512,1024,0.003826666623353958
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,512,1536,0.02296977738539378
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,512,1536,0.0118231111102634
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,512,768,0.003504000190231535
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,768,768,0.021947556071811255
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,512,1024,0.011416888899273343
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,512,512,0.0032133333798911837
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,512,768,0.011092444260915121
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,512,256,0.0028320000403457214
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,512,512,0.02126666737927331
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,512,512,0.011027555498811932
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,512,128,0.002833777831660377
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,512,256,0.010686222049925061
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,512,256,0.020581333173645865
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,512,6144,0.01550044450494978
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,512,64,0.002542222125662698
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,512,128,0.01035822182893753
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,512,128,0.01853155593077342
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,256,65536,0.015519110692871941
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,512,64,0.011600889265537262
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,512,4096,0.02951644526587592
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,512,32,0.011037333144081963
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,256,51200,0.013402666482660504
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,256,65536,0.05450755688879225
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,256,16384,0.008676444490750631
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,256,65536,0.14918133947584364
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,256,51200,0.11984622478485107
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,256,12288,0.007999999655617608
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,256,16384,0.021260443660948012
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,256,16384,0.053341332409116954
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,256,10240,0.007629333270920648
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,256,12288,0.018541332748201158
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,256,12288,0.04515199859937032
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,256,8192,0.0069297779765393995
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,256,10240,0.017873777283562552
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,256,10240,0.04092977775467767
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,512,1024,0.022329777479171753
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,256,7168,0.006643555644485686
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,512,768,0.020576889316240948
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,256,6144,0.006585777633719974
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,256,8192,0.016153777639071148
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,256,8192,0.038021332687801786
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,256,5120,0.006270222365856171
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,256,7168,0.015811555915408664
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,256,6144,0.032920890384250216
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,256,6144,0.015111999379263984
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,256,4096,0.005616000129116907
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,256,5120,0.03155022197299533
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,256,5120,0.01482222146458096
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,512,32,0.0028204443968004654
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,256,3584,0.006256000035338932
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,256,3072,0.006255110932721033
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,256,4096,0.013474666410022311
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,256,4096,0.029394666353861492
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,256,2560,0.006239999913507038
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,256,3584,0.029446221060223047
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,256,3072,0.013463111387358772
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,256,3072,0.026222222381167944
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,256,2048,0.005958222266700532
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,256,2560,0.02643199927277035
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,256,2560,0.012720000412729053
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,256,1536,0.004512888689835866
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,256,51200,0.043162667089038424
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,256,2048,0.012162666353914471
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,256,1024,0.0038933331767717996
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,256,2048,0.025015999873479206
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,256,768,0.0035093331502543557
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,256,1536,0.02438933319515652
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,256,1024,0.02163822286658817
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,256,1024,0.011415111521879831
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,256,768,0.012056888805495368
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,256,768,0.022103110949198406
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,256,256,0.0028106667515304354
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,256,512,0.011026666396194033
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,256,512,0.0214355554845598
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,256,128,0.00254488881263468
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,256,256,0.011400889191362592
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,256,256,0.018984888990720112
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,256,7168,0.03495733274353875
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,256,128,0.011357333097192975
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,256,64,0.002542222125662698
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,256,128,0.017675555414623685
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,256,32,0.002499555548032125
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,128,65536,0.014415999253590902
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,256,64,0.01108977778090371
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,256,32,0.010690666735172272
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,128,51200,0.012723555167516073
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,128,65536,0.05147111084726122
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,256,3584,0.013778666655222574
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,128,16384,0.007977777885066139
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,128,65536,0.14739378293355307
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,128,51200,0.04210222098562452
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,128,12288,0.007312888900438945
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,128,51200,0.11839289135403103
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,128,16384,0.021634666456116572
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,128,16384,0.05271733469433255
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,128,10240,0.007296889192528195
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,256,1536,0.012051555845472546
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,128,12288,0.0440942214594947
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,128,8192,0.006637333167923822
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,128,10240,0.017804443836212158
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,256,512,0.0031582222630580268
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,128,7168,0.006631111105283101
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,128,8192,0.015956444872750174
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,128,8192,0.0362755556901296
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,128,6144,0.006247111078765657
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,128,7168,0.03542222248183356
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,128,7168,0.015650666422314115
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,128,5120,0.00611200018061532
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,128,6144,0.01516888870133294
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,128,6144,0.033253331979115806
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,128,4096,0.005763555566469829
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,128,5120,0.01443911095460256
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,128,5120,0.03157066636615329
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,128,3584,0.005923555543025334
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,128,4096,0.013794666363133324
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,128,4096,0.02915999955601162
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,128,3072,0.005910222315125995
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,128,3584,0.013648000028398303
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,128,3584,0.02846577763557434
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,128,2560,0.006288888967699475
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,128,3072,0.013061333033773633
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,128,3072,0.02682222260369195
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,128,2048,0.005904888941182031
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,128,2560,0.012734221915404001
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,128,2560,0.026791999737421673
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,128,1536,0.004512888689835866
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,128,2048,0.0123857781291008
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,128,2048,0.024550222688251074
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,128,1024,0.003903111235962974
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,128,1536,0.012438221938080259
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,128,768,0.0035173334181308746
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,128,1024,0.021264889174037512
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,128,1024,0.011697777443461947
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,128,12288,0.01831999917825063
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,128,512,0.003228444399105178
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,128,768,0.011776000261306763
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,128,10240,0.04213866591453552
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,128,256,0.0028293333533737394
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,128,768,0.020220445262061227
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,128,512,0.020240000552601285
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,128,128,0.0028168888141711554
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,128,512,0.01075111081202825
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,128,64,0.0024684444069862366
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,128,256,0.011721777419249216
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,128,128,0.017847110827763874
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,128,32,0.0025155554629034465
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,128,128,0.01035822182893753
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,64,65536,0.011161777708265515
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,128,64,0.009859555297427708
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,64,51200,0.01038044442733129
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,64,16384,0.007283555964628856
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,128,32,0.010838222172525195
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,64,12288,0.006467555546098285
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,64,65536,0.05101066827774048
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,64,10240,0.005956444475385878
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,64,16384,0.021591999464564856
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,64,12288,0.018527110417683918
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,64,10240,0.017217778497272067
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,64,7168,0.006129777679840724
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,64,8192,0.01612711118327247
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,64,6144,0.005884444548024072
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,64,7168,0.015691555208630033
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,128,1536,0.022700443863868713
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,64,5120,0.005618666609128316
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,64,4096,0.005405333307054307
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,64,6144,0.015127999915017022
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,64,3584,0.005943999936183293
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,64,5120,0.014436443646748861
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,64,3072,0.005568000177542369
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,64,4096,0.013757333159446716
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,64,2560,0.006031999985376994
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,64,3584,0.013411555853154926
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,64,2048,0.005619555711746216
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,16,128,256,0.020595555504163105
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,64,3072,0.013078221844302284
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,64,1536,0.004543111142185
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,64,2560,0.012735111018021902
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,64,2048,0.012390221986505719
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,64,1536,0.012086222569147745
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,64,768,0.0032195556494924757
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,64,1024,0.011725333001878528
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,64,512,0.003195555466744635
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,64,256,0.002817777709828483
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,64,51200,0.04210933380656772
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,64,768,0.011066666907734342
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,64,128,0.002534222271707323
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,64,64,0.002489777695801523
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,64,8192,0.006606222026877933
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,64,512,0.011032889286677042
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,64,256,0.010679999987284342
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,64,32,0.0028515555378463534
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,64,128,0.010401777923107147
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,32,65536,0.009723555710580613
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,64,64,0.00999466660949919
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,64,32,0.010813333094120026
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,32,16384,0.006245333287451003
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,32,65536,0.05072888731956482
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,32,12288,0.006233777850866318
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,32,51200,0.042774223619037204
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,32,10240,0.0058959999846087555
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,32,16384,0.020929776959949072
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,32,8192,0.0052826665341854095
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,32,7168,0.005610666755172942
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,32,12288,0.018248000078731112
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,32,10240,0.01789066692193349
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,32,6144,0.005578666511509154
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,32,5120,0.005581333405441708
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,32,7168,0.01550044450494978
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,32,4096,0.005547555370463266
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,32,6144,0.015466666883892484
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,32,5120,0.014456000592973499
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,32,3584,0.005938666562239329
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,32,3072,0.005609777652555042
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,32,4096,0.013414222333166333
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,64,1024,0.003846222327815162
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,32,2560,0.005895111295912001
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,32,3584,0.013791999883121915
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,32,2048,0.005271111097600725
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,32,3072,0.013064888616402945
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,32,1536,0.004523555437723796
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,32,1024,0.0038337777886125776
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,32,2560,0.01276000009642707
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,32,768,0.0035004446076022256
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,32,1536,0.012085333466529846
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,32,512,0.003148444410827425
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,32,1024,0.011408000356621213
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,32,256,0.0024906665914588505
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,32,768,0.011384000380833944
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,32,128,0.0028239999794297745
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,32,512,0.011055111057228513
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,32,51200,0.008314666648705801
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,32,64,0.0024684444069862366
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,32,256,0.010677333507272931
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,16,32,32,0.002465777720014254
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,32,128,0.010408889088365767
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,32,64,0.0103511114915212
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,32,32,0.010384889112578498
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,32,8192,0.015853333804342482
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,65536,16384,0.17270755767822266
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,65536,16384,0.3240017890930176
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,65536,12288,0.22732623418172201
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,65536,51200,0.5001280042860243
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,65536,10240,0.1892817815144857
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,65536,12288,0.1309395498699612
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,16,32,2048,0.01276711126168569
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,65536,8192,0.15521866745418972
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,65536,10240,0.11145599683125813
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,65536,7168,0.13405599859025744
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,65536,6144,0.11576799551645915
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,65536,8192,0.13714310857984754
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,65536,7168,0.1003004444970025
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,65536,5120,0.09742133484946357
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,65536,6144,0.0920213328467475
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,65536,4096,0.08151377571953668
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,65536,3584,0.06955999798244901
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,65536,3072,0.06041777796215481
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,65536,4096,0.06876089175542195
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,65536,5120,0.08121955394744873
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,65536,2560,0.051206221183141075
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,65536,3584,0.06086933612823486
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,65536,2048,0.04200622108247545
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,65536,3072,0.052783999178144664
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,65536,1536,0.03270577722125583
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,65536,2560,0.04647199975119697
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,65536,768,0.0188755558596717
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,65536,2048,0.04485955503251818
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,65536,1536,0.03433777888615926
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,65536,512,0.013782222237851886
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,65536,1024,0.02758311066362593
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,65536,256,0.008268444074524773
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,65536,128,0.006227555374304454
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,65536,768,0.023530667026837666
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,65536,64,0.0058959999846087555
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,65536,512,0.019157333506478202
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,65536,256,0.016584888100624084
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,65536,32,0.005904888941182031
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,65536,128,0.014142221874660917
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,65536,64,0.016177778442700703
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,65536,51200,0.9695093366834852
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,65536,32,0.01621866722901662
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,65536,1024,0.02382044494152069
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,51200,65536,0.5281937917073568
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,51200,51200,0.824494202931722
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,51200,65536,1.0936098098754883
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,51200,16384,0.2784453233083089
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,51200,12288,0.20238399505615234
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,51200,16384,0.13993955983055964
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,51200,51200,0.4021448824140761
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,51200,10240,0.1735475593143039
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,51200,8192,0.13890933990478516
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,51200,12288,0.10704888900121053
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,51200,7168,0.1229048834906684
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,51200,7168,0.09552088710996841
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,51200,8192,0.10441688696543376
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,51200,6144,0.10630133416917588
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,51200,5120,0.08964888917075263
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,51200,10240,0.09176266855663723
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,51200,4096,0.0728986660639445
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,51200,5120,0.06732177734375
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,51200,4096,0.05599111318588257
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,51200,6144,0.07431288560231526
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,51200,3072,0.05515377720197042
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,51200,2560,0.047578665945265025
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,51200,2048,0.038763556215498186
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,51200,3072,0.04438933398988512
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,51200,1536,0.03012266755104065
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,51200,2560,0.039635555611716375
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,51200,1024,0.02125066684352027
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,51200,2048,0.03674488928582933
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,51200,768,0.016351110405392118
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,51200,1536,0.0296088887585534
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,51200,512,0.011501332951916588
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,51200,768,0.021336000826623704
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,51200,256,0.007359999749395583
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,51200,512,0.017471111483044095
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,51200,1024,0.023020444644822016
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,51200,128,0.004168888760937585
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,51200,64,0.003551111039188173
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,51200,256,0.01514400045077006
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,51200,128,0.014098667436175875
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,51200,32,0.003530666646030214
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,51200,64,0.01442399952146742
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,51200,32,0.015454222758611044
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,51200,3584,0.0632986691262987
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,51200,3584,0.048651556173960366
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,16384,65536,0.18894133302900526
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,16384,65536,0.3211608992682563
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,16384,16384,0.09099644422531128
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,16384,51200,0.2503608862559001
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,16384,51200,0.14293600453270808
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,16384,12288,0.07186222076416016
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,16384,16384,0.05713422430886162
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,16384,8192,0.045583999819225736
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,16384,10240,0.053156445423762
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,16384,12288,0.044960889551374644
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,16384,10240,0.0404151115152571
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,16384,6144,0.0332293344868554
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,16384,7168,0.03904799951447381
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,16384,8192,0.04089066717359755
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,16384,7168,0.03825155562824673
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,16384,4096,0.024511999554104272
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,16384,3584,0.021585777401924133
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,16384,5120,0.03235288792186313
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,16384,3072,0.01885600056913164
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,16384,4096,0.02723377777470483
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,16384,2560,0.016148444679048326
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,16384,3584,0.025128000312381323
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,16384,2048,0.013433777623706393
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,16384,3072,0.0229102224111557
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,16384,1536,0.010680889089902243
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,16384,2560,0.021430222524536982
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,16384,1024,0.008611555728647444
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,16384,1536,0.018195556269751657
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,16384,768,0.007054222126801808
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,16384,1024,0.0158595558669832
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,16384,512,0.005554666535721884
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,16384,256,0.0032222221295038858
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,16384,768,0.014109333356221518
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,16384,128,0.003156444471743372
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,16384,256,0.012784000072214337
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,16384,64,0.0028533333291610083
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,16384,128,0.011376889215575324
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,16384,32,0.0029297777348094513
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,16384,64,0.012741333080662621
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,16384,5120,0.028845333390765723
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,16384,6144,0.03613155417972141
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,16384,32,0.011785777906576792
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,12288,65536,0.2533288796742757
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,12288,65536,0.1592879957622952
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,12288,51200,0.1996826728185018
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,12288,51200,0.12355911731719971
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,12288,16384,0.0671831104490492
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,12288,12288,0.05276977684762743
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,12288,16384,0.0506915549437205
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,12288,10240,0.04485866758558485
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,16384,2048,0.02010577751530541
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,12288,12288,0.04054222173160977
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,12288,7168,0.033189333147472806
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,12288,8192,0.038402666648228966
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,12288,10240,0.036159111393822566
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,12288,6144,0.029010666741265193
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,12288,5120,0.025640888346566096
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,16384,512,0.013360888593726687
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,12288,7168,0.03422133458985223
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,12288,6144,0.031170666217803955
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,12288,4096,0.020266667008399963
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,12288,3584,0.01759022143152025
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,12288,3072,0.015798222687509324
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,12288,4096,0.025439111722840205
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,12288,5120,0.028939555088678997
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,12288,3584,0.023189332750108507
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,12288,2560,0.013215999636385175
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,12288,2048,0.011341333389282227
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,12288,1536,0.009401777552233802
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,12288,3072,0.020977778567208186
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,12288,1024,0.007861333588759104
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,12288,2048,0.018868444694413077
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,12288,768,0.006346666564544042
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,12288,1536,0.0173973325226042
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,12288,512,0.004601777841647466
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,12288,768,0.013767110804716745
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,12288,256,0.003637333297067218
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,12288,512,0.013070222404268054
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,12288,128,0.0031795555518733132
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,12288,8192,0.03765866822666592
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,12288,256,0.012106666962305704
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,12288,64,0.0031715554909573663
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,12288,128,0.012069332930776807
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,12288,32,0.00291377781993813
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,12288,64,0.01148977792925305
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,12288,32,0.012434666355450949
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,10240,65536,0.21787822246551514
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,10240,65536,0.15313243865966797
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,10240,16384,0.060157332155439586
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,10240,51200,0.11834222740597194
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,12288,2560,0.020459555917316012
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,10240,12288,0.04708533485730489
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,10240,16384,0.04783199893103706
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,10240,10240,0.038784000608656145
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,12288,1024,0.014436443646748861
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,10240,12288,0.039375109805001154
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,10240,7168,0.029393778906928167
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,10240,10240,0.03495999839570787
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,10240,8192,0.03429066803720262
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,10240,6144,0.02645422187116411
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,10240,5120,0.02257599929968516
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,10240,6144,0.02716355522473653
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,10240,4096,0.018213333355055917
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,10240,5120,0.024655999408827886
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,10240,3584,0.015792000624868605
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,10240,4096,0.02239822182390425
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,10240,3072,0.01458666721979777
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,10240,3584,0.02093688812520769
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,10240,51200,0.17372622754838732
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,10240,2560,0.012378666963842181
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,10240,3072,0.019734222027990553
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,10240,2048,0.017308443784713745
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,10240,1536,0.008993777963850234
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,10240,8192,0.03281777766015794
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,10240,1536,0.016199111938476562
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,10240,1024,0.00740622232357661
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,10240,768,0.005708444449636672
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,10240,1024,0.013759999639458127
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,10240,7168,0.0309840010272132
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,10240,512,0.00453955555955569
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,10240,256,0.003543111185232798
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,10240,768,0.013445333474212222
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,10240,128,0.003192000091075897
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,10240,512,0.013144888811641268
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,10240,64,0.0031999999450312722
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,10240,256,0.012083555261294046
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,10240,32,0.002991111121243901
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,10240,128,0.011492444409264458
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,10240,32,0.012476444244384766
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,8192,65536,0.1748124493492974
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,8192,51200,0.13223911656273737
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,8192,65536,0.10311200221379598
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,8192,16384,0.04586933387650383
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,10240,2048,0.010677333507272931
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,8192,12288,0.033040000332726374
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,8192,51200,0.08060089084837171
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,8192,10240,0.02786311176088121
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,8192,8192,0.02570666703912947
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,8192,16384,0.03661777906947666
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,10240,2560,0.01869777838389079
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,8192,7168,0.021807110971874658
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,8192,10240,0.027447111076778833
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,8192,6144,0.01924088928434584
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,8192,5120,0.016568889220555622
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,8192,4096,0.014165333575672574
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,8192,7168,0.024314666787783306
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,8192,6144,0.023939554889996845
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,8192,3584,0.012660444610648684
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,8192,5120,0.021543999512990315
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,8192,3072,0.011681777735551199
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,8192,2560,0.009967111051082611
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,8192,3584,0.018581334087583754
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,8192,3072,0.017684444785118103
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,8192,2048,0.008559111091825698
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,8192,2560,0.017256889078352187
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,8192,1536,0.007616000043021307
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,8192,2048,0.015840889679061044
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,8192,1024,0.005605333381228977
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,8192,1536,0.014467555615637036
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,8192,768,0.0042204442951414315
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,10240,64,0.012387555506494312
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,8192,1024,0.013307555682129331
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,8192,512,0.0038533334930737815
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,8192,256,0.0035128887328836652
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,8192,768,0.01276000009642707
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,8192,128,0.003198222153716617
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,8192,512,0.01240711079703437
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,8192,64,0.0028231110837724474
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,8192,256,0.012415111064910889
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,8192,32,0.0028728888266616394
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,8192,12288,0.03014755580160353
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,8192,128,0.012057777908113269
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,8192,8192,0.026955554882685345
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,8192,64,0.012071111136012606
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,8192,32,0.011720889144473605
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,7168,65536,0.15100977155897352
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,7168,16384,0.04196000099182129
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,7168,51200,0.11788711282942031
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,7168,65536,0.09584977891710068
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,7168,12288,0.033336000310050115
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,7168,51200,0.07390399773915608
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,7168,10240,0.02832177612516615
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,7168,8192,0.02219911085234748
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,7168,16384,0.0343848897351159
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,7168,12288,0.028343111276626587
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,7168,7168,0.020601777566803824
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,7168,10240,0.025349333882331848
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,7168,6144,0.017680888374646504
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,7168,8192,0.02716000046994951
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,7168,5120,0.015603555573357476
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,7168,4096,0.013419555293189155
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,7168,7168,0.0236471113231447
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,7168,3584,0.012054222325483957
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,7168,6144,0.023000000251664057
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,7168,3072,0.010738666686746808
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,7168,2560,0.009661333428488838
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,7168,4096,0.019162666466501024
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,7168,3584,0.017994667092959087
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,7168,2048,0.00832711077398724
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,7168,3072,0.01738933391041226
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,7168,2560,0.01685333251953125
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,7168,1024,0.005233777893914117
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,7168,2048,0.015272888872358533
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,7168,768,0.0041831110914548235
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,7168,1536,0.014137778017255994
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,7168,512,0.003543111185232798
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,7168,1024,0.01311555587583118
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,7168,256,0.003175111073586676
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,7168,768,0.012504888905419244
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,7168,128,0.0031679999083280563
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,7168,512,0.012090666426552666
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,7168,64,0.002830222249031067
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,7168,256,0.012122666670216454
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,7168,32,0.0028435554769304064
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,7168,128,0.011352889239788055
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,7168,64,0.012039999994966718
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,8192,4096,0.019380443625979953
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,7168,32,0.011740444435013665
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,6144,51200,0.09751911295784844
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,6144,65536,0.08688266409767999
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,6144,16384,0.036228444841172956
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,6144,51200,0.0680168867111206
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,6144,12288,0.028753777345021565
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,7168,5120,0.02091377807988061
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,6144,16384,0.03229511115286086
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,6144,10240,0.02495999965402815
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,6144,12288,0.02657777733272976
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,6144,8192,0.021644444929228887
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,6144,7168,0.01941777765750885
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,6144,10240,0.02294933299223582
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,6144,8192,0.024361777636739943
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,6144,7168,0.022630222969584998
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,6144,5120,0.01516888870133294
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,6144,6144,0.021520889467663232
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,6144,4096,0.012135110795497894
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,6144,3584,0.010496888723638324
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,6144,5120,0.020522667302025687
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,6144,4096,0.018179555733998615
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,6144,3072,0.009979555176364051
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,6144,2560,0.008952889177534316
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,6144,3584,0.017863111363516915
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,6144,2048,0.007826666865083907
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,6144,3072,0.01677600045998891
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,6144,1536,0.006897777732875612
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,6144,65536,0.12306488884819879
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,6144,2048,0.01443822185198466
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,6144,1536,0.013754666679435305
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,6144,768,0.004074666649103165
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,6144,1024,0.012777778009573618
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,6144,512,0.003499555504984326
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,6144,768,0.012350222302807702
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,6144,512,0.012093333734406365
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,7168,1536,0.007296889192528195
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,6144,256,0.0031759999692440033
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,6144,6144,0.017143999536832173
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,6144,128,0.0028693332440323303
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,6144,64,0.0028479999552170434
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,6144,32,0.0026355555488003623
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,6144,256,0.01239377756913503
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,6144,128,0.012106666962305704
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,6144,64,0.011354666617181567
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,5120,65536,0.10695199833975898
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,6144,32,0.011394666300879585
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,5120,51200,0.08629333310657078
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,5120,16384,0.0322088897228241
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,5120,65536,0.07922577857971191
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,5120,12288,0.026183999247021143
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,5120,10240,0.022543110781245764
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,5120,51200,0.06230577495363024
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,5120,16384,0.030155556069480047
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,5120,8192,0.0196088883611891
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,5120,12288,0.024352888266245525
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,6144,2560,0.016137777103318107
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,5120,10240,0.021703999903466966
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,5120,6144,0.015740444262822468
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,6144,1024,0.004640000147951974
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,5120,8192,0.024269334144062463
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,5120,5120,0.013962666193644205
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,5120,4096,0.011729777687125735
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,5120,3584,0.010386666489972008
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,5120,6144,0.020917332834667627
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,5120,3072,0.009388444324334463
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,5120,4096,0.018020444446139865
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,5120,2560,0.00833155545923445
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,5120,3584,0.017729777428838942
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,5120,2048,0.007595555649863348
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,5120,3072,0.016128889388508268
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,5120,1536,0.006095110956165526
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,5120,2560,0.014886221951908536
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,5120,1024,0.004224888980388641
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,5120,2048,0.014440000057220459
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,5120,768,0.003887999802827835
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,5120,1536,0.01346666696998808
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,5120,512,0.003573333223660787
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,5120,1024,0.01274400038851632
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,5120,256,0.003024000053604444
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,5120,768,0.012376888758606382
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,5120,128,0.0028248888750871024
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,5120,256,0.01202666676706738
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,5120,64,0.00282222218811512
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,5120,128,0.011407111254003314
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,5120,32,0.002537777854336633
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,5120,64,0.011764444410800934
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,5120,7168,0.017472000585661996
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,5120,32,0.011076444553004371
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,4096,65536,0.08683022525575425
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,5120,7168,0.02167911165290409
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,4096,51200,0.06823111242718168
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,4096,16384,0.028039111031426325
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,4096,65536,0.07150399684906006
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,5120,5120,0.01957155598534478
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,4096,10240,0.018979556030697294
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,4096,16384,0.02637333340115017
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,4096,12288,0.02251288957066006
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,4096,8192,0.01688799924320645
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,4096,7168,0.013747555514176687
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,4096,10240,0.020572443803151447
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,4096,6144,0.012239110966523489
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,4096,8192,0.022681777675946552
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,4096,7168,0.020921778347757127
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,4096,5120,0.010964444114102257
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,4096,4096,0.010447111394670276
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,4096,6144,0.020252444677882724
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,4096,3584,0.008628444539176093
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,5120,512,0.012099555797047086
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,4096,5120,0.018820444742838543
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,4096,3072,0.007948444121413762
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,4096,4096,0.017529777354664274
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,4096,2560,0.007157333195209503
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,4096,2048,0.006215999937719769
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,4096,3072,0.014451555079884
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,4096,1536,0.004699555536111196
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,4096,2560,0.014543111125628153
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,4096,2048,0.013814222481515674
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,4096,1536,0.013105777402718862
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,4096,768,0.0035626664757728577
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,4096,1024,0.012109333442317115
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,4096,512,0.0031591111587153543
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,4096,256,0.0031662223239739737
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,4096,12288,0.02197244432237413
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,4096,768,0.012095111111799875
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,4096,512,0.012055111428101858
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,4096,128,0.0028568889117903183
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,4096,51200,0.05800977680418226
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,4096,32,0.002817777709828483
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,4096,256,0.011710222396585675
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,4096,128,0.011215111447705163
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,4096,64,0.012146666646003723
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,3584,65536,0.07858133316040039
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,4096,32,0.011700444751315646
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,3584,51200,0.06079555882347954
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,3584,16384,0.024234667420387268
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,3584,65536,0.0692302253511217
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,3584,51200,0.05618844429651896
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,3584,16384,0.02550933261712392
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,3584,10240,0.01686755485004849
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,3584,12288,0.02201955517133077
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,4096,3584,0.01625066664483812
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,3584,8192,0.014721777704026965
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,3584,7168,0.013763555222087435
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,3584,10240,0.02030311193731096
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,3584,6144,0.0118568887313207
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,4096,1024,0.0038408889538711975
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,3584,8192,0.022611555125978258
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,3584,5120,0.010628444453080496
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,3584,7168,0.020245333512624104
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,3584,4096,0.0098213329911232
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,3584,3584,0.008626666333940294
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,3584,5120,0.01829600003030565
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,3584,3072,0.007895111209816402
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,3584,4096,0.015807110402319167
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,3584,3584,0.015525332755512662
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,4096,64,0.0028577778074476454
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,3584,3072,0.014102222190962898
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,3584,2048,0.005664000080691443
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,3584,1536,0.004523555437723796
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,3584,2560,0.014446222119861178
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,3584,1024,0.003855111284388436
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,3584,2048,0.013532444834709167
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,3584,768,0.0038542221817705366
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,3584,1536,0.012759110993809171
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,3584,512,0.0032142222755485107
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,3584,1024,0.01239999963177575
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,3584,256,0.0031582222630580268
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,3584,12288,0.01920711166328854
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,3584,768,0.012039999994966718
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,3584,128,0.00282222218811512
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,3584,512,0.012104888757069906
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,3584,64,0.00282577777074443
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,3584,32,0.0026551110463009942
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,3584,256,0.012061333490742577
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,3584,128,0.011071999867757162
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,3072,65536,0.06384088595708211
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,3584,32,0.010738666686746808
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,3072,51200,0.05087111062473721
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,3072,16384,0.020584000481499564
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,3072,65536,0.06759644216961332
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,3072,12288,0.017208000024159748
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,3072,51200,0.05439200003941854
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,3584,6144,0.01923733287387424
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,3072,10240,0.017030222548378837
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,3072,16384,0.02495199938615163
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,3072,8192,0.014877332581414117
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,3072,12288,0.02127200033929613
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,3072,7168,0.012473777764373355
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,3584,2560,0.0069466663731469055
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,3072,10240,0.019938665959570143
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,3072,6144,0.011328889264000786
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,3072,5120,0.009856888817416297
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,3072,8192,0.020015999674797058
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,3072,7168,0.019595555133289762
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,3072,3584,0.008025777836640676
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,3072,6144,0.018221333622932434
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,3072,5120,0.01682400041156345
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,3072,3072,0.0074177781740824384
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,3072,2560,0.0064737776087390045
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,3072,4096,0.015114666687117683
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,3072,2048,0.0052284445199701525
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,3072,3584,0.01479466590616438
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,3072,3072,0.013811555173661975
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,3072,1536,0.004570666700601578
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,3072,1024,0.003913777983850903
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,3072,2560,0.014112000664075216
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,3072,768,0.003488000068399641
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,3072,2048,0.013400889105266996
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,3072,512,0.003167111012670729
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,3072,1536,0.012792000340090858
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,3072,1024,0.01222222215599484
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,3072,768,0.011697777443461947
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,3072,512,0.012072000238630505
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,3584,64,0.011370666325092316
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,3072,64,0.002965333354141977
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,3072,256,0.011721777419249216
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,3072,32,0.0025475554996066624
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,3072,128,0.01178311142656538
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,3072,64,0.011398221883508893
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,2560,65536,0.057484441333346896
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,3072,32,0.01109155515829722
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,2560,51200,0.045328001181284584
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,2560,16384,0.01906844476858775
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,2560,65536,0.06493777698940702
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,2560,51200,0.052729778819613986
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,2560,12288,0.01556622154182858
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,2560,10240,0.014456889695591398
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,3072,4096,0.00923733330435223
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,2560,16384,0.024362666739357844
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,2560,8192,0.012898666991127862
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,2560,12288,0.020863110820452373
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,2560,7168,0.0120000003112687
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,2560,10240,0.01959111127588484
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,2560,6144,0.010660444696744284
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,2560,8192,0.019557333654827543
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,2560,7168,0.018595554762416415
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,2560,5120,0.010006222460005019
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,2560,6144,0.017030222548378837
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,2560,4096,0.008791999684439765
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,2560,3584,0.007920888562997183
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,2560,5120,0.015461333923869662
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,3072,256,0.0028906667398081887
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,2560,3072,0.006918222126033571
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,2560,2560,0.005888000130653381
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,2560,3584,0.014454222387737699
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,3072,128,0.0028115556471877625
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,2560,2048,0.005211555709441503
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,2560,1536,0.004548444516128964
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,2560,3072,0.013696889082590738
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,2560,1024,0.003975999852021535
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,2560,768,0.0035297779573334586
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,2560,2048,0.012844444149070315
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,2560,1536,0.01275644451379776
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,2560,512,0.003330666571855545
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,2560,1024,0.012067555553383298
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,2560,256,0.0028320000403457214
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,2560,768,0.011794666449228922
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,2560,128,0.0025804444319672054
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,2560,64,0.0028275555620590844
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,2560,512,0.012061333490742577
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,2560,32,0.0028168888141711554
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,2560,256,0.011716444459226398
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,2560,128,0.011382222175598145
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,2048,65536,0.050196445650524564
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,2560,64,0.011367999845080905
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,2560,32,0.011391999820868174
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,2048,51200,0.037181334363089666
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,2048,16384,0.016364443633291457
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,2048,65536,0.06252533197402954
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,2048,12288,0.014781332678265043
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,2048,51200,0.0510808891720242
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,2048,10240,0.013094222380055321
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,2048,16384,0.023982221881548565
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,2048,8192,0.01294311136007309
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,2048,12288,0.02092622220516205
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,2048,7168,0.011143111520343356
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,2048,6144,0.0103511114915212
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,2048,10240,0.019335110982259113
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,2048,8192,0.019291554888089497
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,2048,5120,0.009850666754775578
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,2048,4096,0.00797155582242542
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,2560,4096,0.014811555544535318
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,2048,6144,0.015505777464972602
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,2048,3584,0.007290666302045186
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,2048,3072,0.006793777975771163
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,2048,5120,0.014846222268210517
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,2048,2560,0.005909333212508096
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,2048,4096,0.014147554834683737
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,2048,3584,0.014087110757827759
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,2560,2560,0.01369511087735494
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,2048,3072,0.013433777623706393
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,2048,2560,0.013425778183672162
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,2048,1024,0.003955555458863576
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,2048,2048,0.012852444416946836
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,2048,1536,0.01238666640387641
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,2048,768,0.003519111209445529
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,2048,512,0.0032177778581778207
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,2048,1024,0.011720000041855706
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,2048,256,0.0028408887899584244
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,2048,768,0.011753777662913004
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,2048,128,0.00282222218811512
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,2048,512,0.012064889073371887
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,2048,64,0.002534222271707323
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,2048,256,0.011535999675591787
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,2048,32,0.002495999965402815
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,2048,128,0.011343110766675739
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,2048,64,0.012051555845472546
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,1536,65536,0.036666668123669095
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,1536,51200,0.029250668154822454
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,2048,32,0.010828444527255164
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,1536,16384,0.014102222190962898
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,1536,65536,0.0606222218937344
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,1536,12288,0.012739555703269111
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,1536,51200,0.04907733201980591
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,2048,7168,0.017417778571446735
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,1536,10240,0.01145333300034205
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,1536,16384,0.02336888843112522
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,1536,8192,0.010214221974213919
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,1536,7168,0.009738666315873465
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,1536,12288,0.020581333173645865
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,1536,10240,0.018755555152893066
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,1536,6144,0.009939555492666032
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,2048,2048,0.004913777940803104
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,1536,8192,0.016494222813182406
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,1536,5120,0.008750222623348236
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,2048,1536,0.004515555583768421
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,1536,4096,0.007606222397751278
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,1536,7168,0.015846222639083862
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,1536,3584,0.006974221931563483
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,1536,3072,0.00655377780397733
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,1536,6144,0.015184000134468079
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,1536,2560,0.005879111174080107
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,1536,5120,0.014610666367742749
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,1536,4096,0.014106666048367819
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,1536,2048,0.004895110925038655
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,1536,3584,0.013756444056828817
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,1536,1536,0.00452977791428566
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,1536,3072,0.013125333521101209
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,1536,2560,0.013423110875818463
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,1536,2048,0.012545777691735161
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,1536,768,0.0034888887570963967
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,1536,512,0.003216888962520493
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,1536,1536,0.01240711079703437
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,1536,1024,0.011776888536082374
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,1536,256,0.003185777821474605
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,1536,128,0.002826666666401757
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,1536,768,0.011411555939250521
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,1536,512,0.011761777930789523
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,1536,256,0.011404444773991903
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,1536,32,0.002529777793420686
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,1536,128,0.011027555498811932
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,1536,64,0.011365333365069495
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,1536,32,0.011047110789351992
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,1024,51200,0.02165511084927453
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,1024,65536,0.05723377731111315
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,1024,16384,0.011920889218648275
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,1024,51200,0.04725511206520928
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,1024,12288,0.011579555769761404
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,1024,16384,0.022281777527597215
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,1024,10240,0.010370666782061258
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,1024,12288,0.019259555472267997
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,1024,10240,0.017854221993022494
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,1024,8192,0.008856000171767341
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,1536,1024,0.003887999802827835
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,1024,7168,0.009656888743241629
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,1024,6144,0.008914666871229807
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,1024,8192,0.016541333662139047
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,1024,7168,0.015785778562227886
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,1024,6144,0.01518311103185018
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,1024,4096,0.007302222152551015
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,1536,64,0.0024764444679021835
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,1024,3584,0.006960888703664144
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,1024,5120,0.014463999205165438
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,1024,3072,0.006220444622966979
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,1024,4096,0.013787555197874704
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,1024,65536,0.02590755621592204
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,1024,2560,0.005602666487296422
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,1024,3584,0.013762666947311826
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,1024,2048,0.006923555499977536
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,1024,1536,0.005616888817813661
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,1024,2560,0.013081777426931592
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,1024,2048,0.012392889294359418
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,1024,1536,0.012439111040698158
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,1024,768,0.004223111189073986
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,1024,1024,0.011770666473441653
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,1024,512,0.003488000068399641
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,1024,768,0.011688888900809817
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,1024,256,0.0031511110977994073
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,1024,512,0.011711999773979187
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,1024,128,0.002830222249031067
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,1024,256,0.01143022212717268
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,1024,64,0.002642666714058982
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,1024,128,0.011083555718262991
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,1024,5120,0.00795733349190818
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,1024,64,0.011379555695586734
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,768,65536,0.02352711061636607
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,1024,32,0.01090133355723487
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,768,51200,0.019333332777023315
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,768,65536,0.05630399783452352
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,768,16384,0.01127644462717904
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,1024,3072,0.01333688861793942
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,768,51200,0.04574399855401781
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,768,16384,0.021333333518770006
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,768,10240,0.009676444033781687
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,1024,1024,0.004583999928500918
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,768,8192,0.008614222208658854
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,768,12288,0.0188737776544359
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,768,7168,0.009020444419648912
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,768,6144,0.008628444539176093
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,768,10240,0.017508443858888414
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,768,8192,0.016208888755904306
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,768,5120,0.007893333004580604
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,768,7168,0.015840000576443143
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,768,4096,0.007310222420427535
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,768,6144,0.014945778581831189
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,768,5120,0.01445777714252472
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,768,4096,0.013799111048380533
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,768,3072,0.006232000059551663
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,768,2560,0.00553955551650789
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,768,3584,0.013739555246300168
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,768,2048,0.004924444274769889
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,768,3072,0.013409777647919126
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,768,1536,0.004910222358173794
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,768,2560,0.01310488912794325
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,1024,32,0.0025804444319672054
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,768,1024,0.004002666721741359
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,768,2048,0.012453333371215396
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,768,768,0.003882666842805015
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,768,512,0.0035084444615576
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,768,1536,0.01238666640387641
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,768,256,0.0028515555378463534
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,768,1024,0.011726222104496427
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,768,768,0.011718221836619906
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,768,128,0.0028124445428450904
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,768,512,0.011431111229790581
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,768,64,0.0028311111446883944
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,768,256,0.0110871113008923
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,768,128,0.011374221907721626
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,768,32,0.002518222149875429
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,768,12288,0.011326221956147088
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,512,65536,0.017476444443066914
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,768,64,0.010900444454616971
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,512,51200,0.01605955594115787
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,768,32,0.010758221977286868
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,512,16384,0.01037599974208408
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,512,12288,0.010029333333174387
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,512,51200,0.04515022370550367
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,512,10240,0.008972444468074376
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,512,16384,0.021316443880399067
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,512,12288,0.018580444984965853
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,512,8192,0.008160889148712158
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,768,3584,0.0069875551594628235
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,512,7168,0.00902133352226681
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,512,6144,0.008346666892369589
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,512,10240,0.017275555266274344
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,512,8192,0.016189333465364244
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,512,7168,0.01565511193540361
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,512,4096,0.0069777775141927935
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,512,6144,0.014847111370828418
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,512,3584,0.0069679998689227635
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,512,5120,0.014475555883513557
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,512,3072,0.006739555547634761
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,512,4096,0.013444444371594323
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,512,2560,0.005961777849329843
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,512,3584,0.013467555244763693
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,512,2048,0.006256000035338932
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,512,3072,0.01311555587583118
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,512,1536,0.004690666579537922
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,512,2560,0.013087111214796701
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,512,1024,0.0038604442444112566
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,512,2048,0.01239733315176434
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,512,768,0.003624000069167879
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,512,1536,0.012103111379676394
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,512,512,0.003216888962520493
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,512,1024,0.011696889168686338
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,512,256,0.0028737777223189673
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,512,768,0.011378666592968835
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,512,128,0.0028151110228565005
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,512,65536,0.05489777856402927
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,512,512,0.011402666568756104
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,512,64,0.0028195555011431375
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,512,256,0.011359111302428775
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,512,128,0.011207111179828644
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,512,64,0.011039111349317761
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,256,65536,0.017160000072585214
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,512,32,0.011048888994587792
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,256,51200,0.01477777792347802
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,256,16384,0.009332444104883406
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,512,5120,0.007976888782448238
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,256,65536,0.053344001372655235
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,256,51200,0.042727109458711415
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,256,16384,0.02093244426780277
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,256,10240,0.007605333295133378
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,256,8192,0.006928000185224745
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,256,12288,0.018570666511853535
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,256,7168,0.006639110959238476
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,256,10240,0.017400888933075797
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,256,6144,0.00692622239391009
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,256,5120,0.0069146665434042616
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,256,7168,0.015615999698638916
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,256,4096,0.006302222195598815
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,256,6144,0.015124445160230001
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,256,5120,0.014451555079884
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,256,3584,0.006240889016124938
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,256,3072,0.006052444378534953
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,256,4096,0.013809777796268463
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,256,2560,0.005928888916969299
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,256,3584,0.01348355578051673
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,256,3072,0.013428444663683573
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,256,2048,0.005607111172543631
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,256,1536,0.0042453333735466
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,256,2560,0.013165333204799227
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,512,32,0.0025724443710512584
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,256,1024,0.0038862224254343244
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,256,768,0.0034959999223550162
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,256,2048,0.012454222473833295
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,256,512,0.003228444399105178
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,256,1024,0.012063999970753988
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,256,256,0.0028488888508743713
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,256,768,0.011357333097192975
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,256,128,0.0024986666523747975
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,256,512,0.012074666718641916
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,256,12288,0.008039111064540016
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,256,64,0.0028364445186323593
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,256,32,0.0028133332315418455
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,256,256,0.011864888999197217
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,256,128,0.01105955574247572
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,128,65536,0.015127110812399121
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,256,64,0.01069866700304879
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,128,51200,0.012582222620646158
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,256,32,0.011402666568756104
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,128,16384,0.00830844458606508
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,128,12288,0.007639110916190677
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,256,8192,0.016155555844306946
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,128,51200,0.04176000091764662
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,128,16384,0.02125599980354309
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,128,10240,0.006937777830494775
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,128,12288,0.019259555472267997
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,128,10240,0.01754666699303521
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,128,7168,0.00628355559375551
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,128,8192,0.016504888733228047
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,128,6144,0.006281777802440856
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,128,7168,0.01569688816865285
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,128,5120,0.005982222242487802
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,128,6144,0.015481778317027621
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,128,4096,0.005929777605666055
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,256,1536,0.012290666500727335
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,128,3584,0.006236444330877728
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,128,5120,0.014492443866199918
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,128,3072,0.005946666830115848
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,128,4096,0.014148443937301636
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,128,2560,0.00629066675901413
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,128,3584,0.013421333498424955
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,128,2048,0.00555377784702513
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,128,3072,0.013423999978436364
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,128,1536,0.004523555437723796
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,128,2560,0.013156444662147097
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,128,1024,0.0038568890757030914
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,128,2048,0.0124195557501581
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,128,768,0.003569777641031477
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,128,512,0.0031999999450312722
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,128,1536,0.01256711118751102
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,128,256,0.002871111035346985
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,128,1024,0.01200799975130293
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,128,128,0.0028355556229750314
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,128,768,0.011388444238238864
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,128,8192,0.006613333192136552
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,128,64,0.0024826667375034755
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,128,32,0.0028328889360030494
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,128,256,0.011742221812407175
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,64,65536,0.011196444431940714
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,128,128,0.011752000285519494
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,64,51200,0.010381333529949188
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,128,64,0.01069866700304879
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,64,16384,0.006592000110281839
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,128,32,0.010400888820489248
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,64,12288,0.007266666326257918
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,64,65536,0.05100889007250468
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,64,10240,0.006630222416586346
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,64,51200,0.04244622257020739
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,64,8192,0.006634666687912411
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,64,16384,0.020640000700950623
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,64,7168,0.00646311127477222
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,64,12288,0.018547554810841877
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,64,6144,0.006287999865081575
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,64,10240,0.017247110605239868
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,64,5120,0.005934222290913264
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,64,8192,0.016207999653286405
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,64,4096,0.005600888695981767
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,64,7168,0.015459555718633862
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,64,3584,0.006141333530346553
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,64,6144,0.014783999986118741
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,64,3072,0.005886222339338726
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,64,5120,0.014153778553009033
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,64,2560,0.005946666830115848
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,64,4096,0.013812444276279874
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,64,2048,0.005931555396980709
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,64,3584,0.013430222041077085
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,64,1536,0.004540444248252445
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,64,3072,0.01312711089849472
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,64,1024,0.003564444267087512
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,64,2560,0.013082666529549493
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,64,768,0.0034959999223550162
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,64,2048,0.012717333104875354
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,64,512,0.0032035555276605818
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,64,1536,0.012227555943859948
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,64,256,0.0028071111689011254
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,64,128,0.002805333377586471
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,64,1024,0.011759111450778114
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,64,64,0.002473777780930201
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,64,768,0.011077333655622272
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,128,65536,0.05074222220314873
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,64,512,0.011768889096048145
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,64,32,0.0024871110088295406
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,64,256,0.011036444041464063
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,32,65536,0.011353777514563667
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,64,128,0.011418666276666852
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,32,51200,0.0099982221921285
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,64,64,0.011021333436171213
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,32,16384,0.006912888752089606
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,128,512,0.011800888511869641
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,64,32,0.010037333601050908
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,32,12288,0.006648889018429651
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,32,10240,0.00692622239391009
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,32,65536,0.051001777251561485
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,32,8192,0.0063075555695427795
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,32,51200,0.04242755638228523
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,32,7168,0.005612444546487596
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,32,16384,0.02070755594306522
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,32,6144,0.006234666539563074
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,32,12288,0.018592889110247295
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,32,5120,0.005209777918126848
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,32,10240,0.017337777548366122
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,32,8192,0.01650311052799225
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,32,4096,0.005599110904667113
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,32,3584,0.005598222215970357
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,32,7168,0.015503999259736804
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,32,3072,0.0052639999323421055
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,32,2560,0.00563466673096021
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,32,5120,0.014491554763582019
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,32,4096,0.013456888496875763
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,32,2048,0.005610666755172942
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,32,3584,0.013805333111021252
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,32,3072,0.013076444466908773
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,32,1536,0.0045422220395671
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,32,1024,0.003847111016511917
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,32,2560,0.01313333296113544
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,32,768,0.003399111123548614
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,32,2048,0.012087110843923358
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,32,1536,0.012491555677519904
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,32,1024,0.012050666742854647
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,32,256,0.0028728888266616394
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,32,768,0.011416888899273343
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,32,128,0.002522666628162066
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,32,512,0.011152889165613385
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,32,256,0.012061333490742577
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,32,32,0.002826666666401757
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,32,128,0.011411555939250521
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,32,64,0.010672888822025724
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,32,32,0.01130844404300054
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,65536,16384,0.3262426588270399
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,15,32,6144,0.014847111370828418
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,65536,51200,0.501131534576416
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,65536,12288,0.22697777218288848
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,32,512,0.00286666676402092
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,65536,16384,0.17191021972232393
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,65536,51200,0.9618604448106555
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,65536,12288,0.13062755266825357
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,15,32,64,0.002473777780930201
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,65536,8192,0.15588533878326416
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,65536,10240,0.1890960004594591
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,65536,7168,0.13384355439080134
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,65536,7168,0.10220088561375935
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,65536,6144,0.11555288897620307
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,65536,5120,0.0971520013279385
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,65536,8192,0.11585599846310085
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,65536,4096,0.08072266976038615
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,65536,6144,0.09466933541827732
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,65536,5120,0.08078489038679335
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,65536,3584,0.06945066981845431
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,65536,3072,0.060292442639668785
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,65536,2560,0.05075822273890177
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,65536,4096,0.06722578075197008
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,65536,3072,0.05379911263783773
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,65536,2560,0.04878133204248217
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,65536,3584,0.05783466498057047
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,65536,2048,0.038732445902294584
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,65536,1024,0.023504889673656885
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,65536,768,0.01882222294807434
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,65536,1536,0.0347946650452084
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,65536,512,0.013478221992651621
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,65536,1024,0.026946667167875502
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,65536,256,0.008215111162927415
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,65536,512,0.018921777606010437
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,65536,10240,0.11187199751536052
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,65536,128,0.0063573333124319715
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,65536,64,0.005888000130653381
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,65536,256,0.01646488904953003
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,65536,32,0.005888888819350137
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,65536,128,0.014426666829321118
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,65536,64,0.014945778581831189
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,65536,32,0.016167110866970487
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,65536,2048,0.04185333185725742
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,65536,1536,0.03243022163709005
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,51200,65536,0.5259733200073242
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,51200,16384,0.2755875587463379
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,65536,768,0.023644444015291
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,51200,51200,0.4017288949754503
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,51200,51200,0.8482497533162435
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,51200,65536,1.0896480348375108
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,51200,12288,0.20572266313764784
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,51200,16384,0.13949778344896105
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,51200,10240,0.16904800468020967
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,51200,12288,0.10688000255160862
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,51200,8192,0.09465866618686253
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,51200,7168,0.12067111333211263
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,51200,6144,0.10607733329137166
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,51200,7168,0.08309600088331434
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,51200,6144,0.07646666632758246
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,51200,4096,0.0711395541826884
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,51200,5120,0.06742933061387804
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,51200,3584,0.06275555822584364
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,51200,4096,0.05686666568120321
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,51200,3072,0.05487822161780464
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,51200,2560,0.04606399933497111
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,51200,3584,0.048808889256583325
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,51200,3072,0.04548089040650261
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,51200,2048,0.038373334540261164
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,51200,2560,0.0406640006436242
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,51200,1536,0.029969778325822618
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,51200,1024,0.02147644427087572
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,51200,2048,0.033131556378470525
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,51200,768,0.016136889656384785
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,51200,512,0.011365333365069495
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,51200,1536,0.02921244502067566
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,51200,768,0.020340444313155282
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,51200,256,0.00757422215408749
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,51200,512,0.017457778255144756
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,51200,128,0.003922666526503033
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,51200,256,0.014480888843536377
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,51200,8192,0.14086843861473933
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,51200,64,0.003510222252872255
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,51200,32,0.0035866668654812705
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,51200,128,0.013765333427323235
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,51200,5120,0.0883644421895345
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,51200,64,0.013773333695199756
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,51200,32,0.014487110906177096
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,16384,65536,0.31988623407151967
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,16384,51200,0.25003377596537274
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,16384,65536,0.18348799811469185
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,16384,51200,0.14158311155107287
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,16384,16384,0.09126222133636475
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,16384,12288,0.07135377989874946
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,16384,10240,0.053287999497519604
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,16384,16384,0.056532442569732666
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,16384,12288,0.04514666729503208
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,16384,7168,0.03916533456908332
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,16384,8192,0.04435822367668152
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,16384,10240,0.04012889001104567
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,16384,8192,0.04200977749294705
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,16384,6144,0.03347911106215583
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,16384,5120,0.029140445921156142
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,16384,7168,0.03776266508632236
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,16384,4096,0.024604444702466328
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,16384,3584,0.02158044444190131
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,16384,6144,0.03628266519970364
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,16384,5120,0.031678222947650485
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,16384,3072,0.01889155473974016
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,16384,4096,0.027170666389995154
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,51200,10240,0.09161955780453152
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,16384,2560,0.016136000553766888
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,16384,2048,0.013412444127930535
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,16384,1536,0.010690666735172272
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,16384,3584,0.02439022229777442
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,16384,2560,0.021687999367713928
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,16384,1024,0.008606221940782335
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,16384,768,0.006912888752089606
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,16384,2048,0.020287111401557922
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,16384,1536,0.017861333158281114
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,16384,512,0.004914666629499859
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,16384,1024,0.015455999308162265
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,16384,256,0.003519999898142285
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,16384,768,0.01382844481203291
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,16384,128,0.003156444471743372
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,16384,64,0.0028044444819291434
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,16384,512,0.012739555703269111
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,16384,32,0.0028293333533737394
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,16384,256,0.011749332977665795
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,16384,128,0.011747555600272285
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,16384,64,0.012098666694429187
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,16384,32,0.011729777687125735
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,12288,65536,0.25268620914883083
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,12288,65536,0.16063200102912054
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,51200,1024,0.023365333676338196
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,12288,51200,0.20015645027160645
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,12288,16384,0.06699466705322266
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,12288,51200,0.12305688858032227
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,12288,12288,0.05227466755443149
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,12288,10240,0.04485688938034905
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,12288,16384,0.050072001086341016
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,12288,12288,0.04061333338419596
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,12288,7168,0.0331857767370012
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,12288,10240,0.03613777624236213
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,12288,6144,0.029065777858098347
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,12288,8192,0.037567999627855085
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,12288,5120,0.025662221842341956
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,16384,3072,0.023342221975326538
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,12288,6144,0.03194222185346816
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,12288,7168,0.03572533196873135
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,12288,4096,0.020227554771635268
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,12288,3584,0.017543110582563613
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,12288,3072,0.015832000308566622
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,12288,2560,0.013429332938459186
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,12288,4096,0.02558044426971012
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,12288,3584,0.022385777698622808
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,12288,2048,0.011348444554540845
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,12288,3072,0.021951999929216173
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,12288,2560,0.02086488902568817
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,12288,1024,0.007823111282454597
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,12288,1536,0.01713244451416863
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,12288,2048,0.019357333580652874
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,12288,768,0.006212444355090459
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,12288,512,0.004540444248252445
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,12288,1024,0.014454222387737699
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,12288,256,0.0035617777870761026
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,12288,768,0.01387111097574234
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,12288,128,0.0031724443866146933
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,12288,512,0.01240355521440506
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,12288,64,0.0031786666562159858
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,12288,256,0.011700444751315646
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,12288,32,0.0028728888266616394
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,12288,128,0.011371555427710215
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,12288,8192,0.03765689002143012
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,12288,64,0.011696000066068439
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,12288,32,0.011757333245542316
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,10240,65536,0.2180968920389811
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,10240,51200,0.17278488477071127
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,10240,65536,0.15268177456325954
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,10240,16384,0.060064891974131264
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,10240,51200,0.11804621749454075
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,10240,12288,0.04696711235576206
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,10240,10240,0.03872177667087979
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,12288,5120,0.026517333255873785
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,10240,8192,0.03264177838961283
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,10240,12288,0.039213332864973284
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,10240,16384,0.048469334840774536
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,12288,1536,0.009306666751702627
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,10240,7168,0.029517332712809246
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,10240,10240,0.034866667456097074
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,10240,8192,0.03178755442301432
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,10240,5120,0.022498667240142822
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,10240,4096,0.018276444739765592
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,10240,7168,0.031573332018322416
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,10240,3584,0.01612444387541877
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,10240,6144,0.027746667464574177
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,10240,3072,0.014360888136757744
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,10240,5120,0.02552088929547204
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,10240,2560,0.012286221815480126
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,10240,2048,0.010686222049925061
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,10240,3584,0.020822222034136455
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,10240,1536,0.009165333376990424
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,10240,3072,0.01959822244114346
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,10240,2560,0.019090667366981506
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,10240,1024,0.007370666497283512
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,10240,2048,0.016873778568373788
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,10240,768,0.005910222315125995
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,10240,512,0.004863111095296012
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,10240,1536,0.0162453336848153
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,10240,1024,0.013902222116788229
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,10240,256,0.003993777765168084
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,10240,768,0.012992888689041138
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,10240,128,0.003297777846455574
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,10240,64,0.0028488888508743713
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,10240,256,0.012059555285506778
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,10240,128,0.011412444214026133
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,10240,32,0.003141333245568805
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,10240,64,0.012078222301271228
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,10240,32,0.011401777466138205
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,8192,65536,0.17512710889180502
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,8192,65536,0.10584711366229588
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,8192,51200,0.13098488913642034
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,8192,16384,0.04567377765973409
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,10240,6144,0.0262444449795617
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,8192,12288,0.032841778463787503
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,8192,51200,0.08023289177152845
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,8192,10240,0.02773422168360816
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,8192,16384,0.0362026658323076
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,8192,8192,0.02532800038655599
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,8192,12288,0.030373334884643555
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,10240,4096,0.02239377796649933
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,8192,7168,0.021799110703998145
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,8192,10240,0.027218666341569688
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,8192,6144,0.019189332922299702
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,8192,5120,0.016527111331621807
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,8192,8192,0.026946667167875502
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,8192,4096,0.014645333091417948
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,8192,7168,0.025302223033375208
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,8192,6144,0.024142222272025213
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,8192,3584,0.012421333127551608
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,8192,5120,0.021273778544531927
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,8192,3072,0.011400000088744693
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,8192,2560,0.00996977753109402
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,8192,4096,0.019303111566437613
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,8192,2048,0.00867022242810991
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,8192,1536,0.00757155567407608
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,8192,2560,0.017529777354664274
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,10240,512,0.012458666331238218
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,8192,2048,0.015156444576051501
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,8192,1024,0.005605333381228977
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,8192,768,0.004578666554556953
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,8192,512,0.003536000019974179
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,8192,1536,0.013922666509946188
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,8192,1024,0.013071999781661563
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,8192,256,0.003165333428316646
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,8192,768,0.013103110922707452
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,8192,128,0.003195555466744635
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,8192,64,0.002830222249031067
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,8192,512,0.01204622205760744
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,8192,32,0.002814222127199173
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,8192,128,0.012095111111799875
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,8192,64,0.011033777561452655
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,8192,32,0.011406222151385413
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,7168,65536,0.14974221918318006
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,7168,51200,0.11756443977355957
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,7168,16384,0.04206044475237528
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,7168,65536,0.09442400270038181
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,7168,12288,0.033300442828072443
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,7168,51200,0.07399644454320271
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,7168,10240,0.028187556399239436
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,7168,16384,0.03390399946106805
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,7168,8192,0.022317333353890315
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,7168,12288,0.028252445989184912
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,7168,7168,0.020495999190542433
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,7168,6144,0.017812444104088675
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,7168,10240,0.025432000557581585
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,7168,8192,0.026759111218982275
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,7168,7168,0.024134222004148696
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,7168,5120,0.015785778562227886
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,8192,3584,0.018654222289721172
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,8192,3072,0.017893332574102614
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,7168,4096,0.013904000322024027
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,7168,3584,0.012034667034943899
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,7168,6144,0.02309688925743103
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,7168,3072,0.010844444235165914
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,7168,5120,0.02086399992307027
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,7168,2560,0.009655111365848118
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,7168,4096,0.019270223047998216
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,7168,3584,0.017839110559887357
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,7168,3072,0.017872888180944655
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,7168,1536,0.007248889240953658
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,7168,1024,0.005224888937340842
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,7168,2560,0.016664889123704698
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,7168,2048,0.014785778191354541
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,7168,768,0.004190222256713443
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,7168,1536,0.013857777747843
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,7168,512,0.003506666670242945
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,7168,256,0.00319377767542998
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,7168,1024,0.012823111481136747
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,7168,128,0.0028231110837724474
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,7168,768,0.012840888566441007
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,7168,64,0.002834666727317704
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,7168,512,0.012124444047609964
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,7168,256,0.011364444262451597
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,7168,32,0.0028328889360030494
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,7168,128,0.011376000112957425
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,7168,64,0.011419555379284753
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,6144,65536,0.12343111303117539
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,7168,32,0.011075555450386472
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,6144,16384,0.03604088889227973
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,6144,51200,0.09718755880991618
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,6144,65536,0.08752177821265326
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,6144,12288,0.028773334291246202
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,6144,51200,0.06746488809585571
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,6144,10240,0.024677332904603746
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,6144,16384,0.03236000074280633
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,6144,8192,0.021893334057595994
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,6144,12288,0.02570399973127577
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,6144,7168,0.018947554959191214
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,6144,10240,0.02310666607485877
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,6144,6144,0.017151110702090792
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,6144,8192,0.02477955487039354
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,6144,5120,0.015192000402344598
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,6144,7168,0.023696889479955036
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,6144,4096,0.011752888560295105
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,6144,6144,0.02252977755334642
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,6144,3584,0.01033333357837465
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,6144,3072,0.010020444790522257
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,6144,4096,0.01886399918132358
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,6144,2560,0.009135111338562435
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,6144,3584,0.01755466726091173
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,8192,256,0.01204622205760744
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,6144,2048,0.007896888587209914
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,6144,1536,0.006746666712893381
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,6144,2560,0.01590755581855774
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,6144,2048,0.014151111245155334
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,6144,1024,0.004872000051869286
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,6144,768,0.0041955556306574075
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,6144,1536,0.013769778112570444
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,6144,512,0.003576888806290097
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,6144,1024,0.012723555167516073
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,6144,256,0.0031635556370019913
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,6144,768,0.012616000241703458
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,6144,128,0.002874666617976295
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,6144,512,0.012077333198653327
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,6144,64,0.002867555452717675
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,6144,256,0.011693333586057028
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,6144,32,0.0025439999169773525
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,6144,128,0.011376889215575324
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,6144,64,0.01203733351495531
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,5120,65536,0.10787110858493382
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,6144,32,0.011359111302428775
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,5120,51200,0.08590844604704116
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,5120,65536,0.07912177509731717
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,5120,16384,0.03229422370592753
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,7168,2048,0.008295111358165741
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,5120,12288,0.026103110777007207
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,6144,5120,0.019835554891162448
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,5120,10240,0.02221600049071842
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,5120,16384,0.0299217767185635
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,5120,8192,0.019703111714786954
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,5120,7168,0.017363554901546903
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,6144,3072,0.017516444126764934
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,5120,10240,0.02215822206603156
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,5120,6144,0.015505777464972602
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,5120,5120,0.014097778333557976
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,5120,7168,0.021936888496081035
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,5120,4096,0.011979555918110741
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,5120,6144,0.021199110481474135
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,5120,3584,0.010326222413116032
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,5120,5120,0.01921599937809838
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,5120,3072,0.00942488925324546
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,5120,4096,0.018232888645595975
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,5120,2560,0.008595555192894405
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,5120,3584,0.016695110334290397
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,5120,3072,0.015818667080667283
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,5120,2048,0.007439999944633908
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,5120,2560,0.015124445160230001
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,5120,1536,0.006214222146405115
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,5120,2048,0.014117333624098035
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,5120,1024,0.004534222185611725
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,5120,1536,0.013735999663670858
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,5120,768,0.004015111260943943
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,5120,1024,0.013077333569526672
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,5120,51200,0.06203555398517185
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,5120,512,0.0035048888789282907
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,5120,768,0.012466666599114736
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,5120,256,0.002942222274012036
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,5120,128,0.002833777831660377
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,5120,512,0.011445333560307821
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,5120,256,0.011735111474990845
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,5120,64,0.0028355556229750314
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,5120,32,0.002826666666401757
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,5120,8192,0.023918223049905565
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,5120,64,0.012054222325483957
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,4096,65536,0.08732977840635513
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,5120,32,0.011417778001891242
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,4096,51200,0.06827911403444079
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,4096,16384,0.027847111225128174
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,4096,12288,0.021597334080272253
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,4096,51200,0.05771288606855604
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,4096,10240,0.01904533306757609
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,4096,16384,0.026505778233210247
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,4096,12288,0.022333333889643352
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,4096,8192,0.016861332787407767
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,4096,7168,0.013869333598348828
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,4096,10240,0.02091377807988061
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,4096,6144,0.012356444365448423
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,4096,8192,0.02331999937693278
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,4096,5120,0.010820444259378644
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,4096,7168,0.02109688851568434
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,4096,4096,0.01000711073478063
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,4096,6144,0.020900444851981267
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,4096,3584,0.008839111361238692
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,4096,5120,0.018699554933442008
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,4096,3072,0.008281778130266402
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,4096,4096,0.017245334055688646
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,4096,2560,0.007268444531493717
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,4096,3584,0.015533333023389181
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,4096,2048,0.006231110956933763
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,5120,12288,0.02377066678471035
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,4096,3072,0.014831110835075378
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,4096,1536,0.005223111146026188
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,4096,2560,0.014676445060306124
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,4096,1024,0.003891555385457145
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,4096,768,0.0035128887328836652
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,4096,2048,0.013818666338920593
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,4096,1536,0.013094222380055321
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,4096,512,0.0035413333939181436
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,4096,256,0.003170666595300039
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,4096,768,0.012381333443853589
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,4096,512,0.011369778050316704
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,4096,128,0.0028159999185138275
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,4096,64,0.002520888836847411
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,4096,128,0.011015999648306104
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,4096,32,0.002530666689078013
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,4096,64,0.011424889167149862
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,3584,65536,0.07833421892589994
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,4096,32,0.010854221880435944
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,3584,51200,0.06069866816202799
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,3584,65536,0.07017511129379272
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,3584,16384,0.02370400064521366
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,3584,51200,0.05561421977149116
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,3584,12288,0.01921955578856998
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,3584,16384,0.025054223007626
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,5120,128,0.011769777370823754
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,3584,10240,0.016639999217457242
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,3584,12288,0.021760000122918025
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,3584,8192,0.014811555544535318
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,3584,7168,0.013328889177905189
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,4096,1024,0.012744888663291931
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,3584,6144,0.011938666303952536
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,3584,8192,0.021776888105604384
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,3584,5120,0.010436444646782346
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,4096,256,0.011404444773991903
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,3584,7168,0.02028888960679372
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,3584,6144,0.02032800018787384
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,3584,4096,0.009688888986905416
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,3584,3584,0.008633777499198914
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,3584,5120,0.01812622282240126
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,3584,3072,0.007841777470376756
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,3584,2560,0.006728000111050076
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,3584,3584,0.014832889040311178
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,3584,2048,0.00554666668176651
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,3584,3072,0.014468444718254937
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,3584,1536,0.00452977791428566
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,3584,2048,0.01349688900841607
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,3584,1024,0.003939555750952827
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,3584,1536,0.01274577776590983
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,3584,768,0.003549333247873518
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,3584,1024,0.012333333492279053
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,3584,512,0.0032231110251612137
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,3584,768,0.012048000262843238
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,3584,256,0.0028400001012616684
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,3584,512,0.011412444214026133
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,3584,256,0.011415111521879831
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,3584,10240,0.020618667205174763
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,3584,128,0.0028133332315418455
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,3584,64,0.00250133333934678
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,4096,65536,0.07254933648639254
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,3584,32,0.002512000087234709
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,3584,128,0.011728000309732227
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,3584,64,0.011210666762457954
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,3072,65536,0.06423022349675496
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,3584,32,0.011476444701353708
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,3072,51200,0.05089955528577169
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,3584,4096,0.016152888536453247
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,3072,16384,0.02056711084312863
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,3072,65536,0.06732266479068331
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,3072,12288,0.01722133325205909
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,3072,10240,0.016749334004190233
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,3072,51200,0.0539191100332472
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,3072,16384,0.0248346659872267
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,3584,2560,0.014489778214030795
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,3072,12288,0.02130311065249973
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,3072,7168,0.012657778130637275
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,3072,10240,0.019896000623703003
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,3072,6144,0.011004444625642566
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,3072,5120,0.009973333113723332
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,3072,8192,0.020868443780475195
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,3072,4096,0.009343999955389235
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,3072,7168,0.01906399925549825
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,3072,3584,0.008303110798199972
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,3072,6144,0.01881511178281572
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,3072,3072,0.007283555964628856
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,3072,5120,0.016511110795868766
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,3072,2560,0.006575999988449945
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,3072,4096,0.0151591118839052
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,3072,2048,0.005555555638339784
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,3072,1536,0.004520888957712385
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,3072,3072,0.014143110977278816
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,3072,2560,0.013546666337384118
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,3072,1024,0.003858666867017746
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,3072,768,0.00350577798154619
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,3072,2048,0.013065777719020844
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,3072,512,0.003156444471743372
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,3072,1024,0.012075555821259817
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,3072,256,0.0028693332440323303
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,3072,512,0.011413333316644033
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,3072,128,0.0028115556471877625
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,3072,256,0.011688888900809817
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,3072,64,0.002507555608948072
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,3072,128,0.011045333411958484
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,3072,32,0.0025128889828920364
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,3072,64,0.011750222080283694
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,3072,32,0.011015111373530494
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,2560,65536,0.057709336280822754
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,3072,8192,0.015111999379263984
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,2560,51200,0.0455351107650333
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,2560,16384,0.018868444694413077
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,2560,65536,0.06471733252207439
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,2560,12288,0.015881778465376962
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,2560,16384,0.024285333024130926
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,2560,10240,0.014153778553009033
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,3072,3584,0.014479999740918478
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,2560,12288,0.020959999826219346
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,2560,8192,0.012801777985360889
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,2560,7168,0.011892444557613797
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,2560,10240,0.019842666056421068
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,3072,1536,0.012433778080675336
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,2560,8192,0.019882667395803664
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,2560,6144,0.010763555765151978
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,2560,5120,0.010087110930018956
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,3072,768,0.01204711116022534
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,2560,7168,0.018771555688646104
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,2560,6144,0.017636444833543565
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,2560,5120,0.015478221906556023
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,2560,3072,0.0069644442862934535
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,2560,4096,0.014456889695591398
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,2560,2560,0.005920889063013925
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,2560,3584,0.014096889230940076
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,2560,2048,0.004929777648713854
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,2560,3072,0.013762666947311826
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,2560,1536,0.004573333180612988
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,2560,2560,0.013076444466908773
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,2560,1024,0.0038604442444112566
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,2560,2048,0.013119999733236102
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,2560,768,0.003499555504984326
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,2560,1536,0.012719111310111152
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,2560,512,0.0034977777136696708
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,2560,1024,0.011734222372372946
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,2560,256,0.0031600000543726813
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,2560,768,0.012058667010731168
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,2560,128,0.0028159999185138275
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,2560,512,0.011697777443461947
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,2560,64,0.0028071111689011254
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,2560,256,0.011358222199810876
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,2560,128,0.01109155515829722
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,2560,32,0.002528000002106031
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,2560,64,0.011750222080283694
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,2048,65536,0.05009777678383721
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,2048,51200,0.03718311256832547
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,2560,32,0.011032000184059143
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,2048,16384,0.016439111696349252
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,2048,65536,0.06208266814549764
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,2560,4096,0.008962666822804345
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,2048,12288,0.014690667390823364
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,2560,3584,0.007822222179836696
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,2048,51200,0.050662222835752696
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,2048,10240,0.013430222041077085
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,2048,8192,0.012311999996503195
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,2048,12288,0.02067377832200792
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,2048,10240,0.019201777047581144
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,2048,8192,0.018556444181336295
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,2048,6144,0.010429333481523724
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,2048,5120,0.00941066692272822
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,2048,7168,0.016639999217457242
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,2048,4096,0.00851111114025116
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,2048,6144,0.015497777197096082
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,2048,3584,0.007521777517265744
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,2048,5120,0.01479466590616438
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,2048,3072,0.006576889091067844
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,2048,4096,0.014200000299347771
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,2048,2560,0.005594666633341048
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,2048,3584,0.013834666874673633
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,2560,51200,0.05247999893294441
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,2048,2048,0.004947555561860402
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,2048,3072,0.013288000391589271
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,2048,1536,0.004558222161398994
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,2048,1024,0.003932444585694207
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,2048,2560,0.013063111239009433
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,2048,768,0.003528000166018804
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,2048,2048,0.012783110969596438
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,2048,1536,0.012392889294359418
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,2048,512,0.003177777760558658
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,2048,1024,0.01240799989965227
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,2048,256,0.0031795555518733132
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,2048,128,0.0028497777465316984
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,2048,512,0.011373333632946014
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,2048,64,0.00249777775671747
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,2048,128,0.011725333001878528
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,2048,32,0.0028248888750871024
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,2048,16384,0.02374222212367588
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,2048,64,0.011035555766688453
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,1536,65536,0.036602665980656944
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,2048,7168,0.011223110887739392
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,2048,32,0.011367110742463006
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,1536,51200,0.02914666798379686
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,1536,16384,0.014130666851997375
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,1536,65536,0.060234665870666504
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,1536,12288,0.012509333590666452
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,1536,10240,0.01148622234662374
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,1536,51200,0.04890311095449659
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,1536,8192,0.01032977799574534
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,1536,16384,0.023199111223220825
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,1536,12288,0.020184889435768127
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,1536,10240,0.018774222996499803
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,1536,6144,0.009716444545321995
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,1536,8192,0.016671111186345417
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,1536,5120,0.008344888687133789
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,1536,7168,0.015857777661747403
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,1536,4096,0.007616000043021307
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,1536,6144,0.015578667322794596
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,1536,3584,0.0069715554515520734
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,1536,5120,0.014825777875052558
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,1536,3072,0.006251555350091722
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,1536,4096,0.013758222262064615
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,1536,2560,0.005566222386227713
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,1536,3584,0.013755555782053204
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,2048,768,0.011755555868148804
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,1536,2048,0.005231110999981563
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,1536,3072,0.013134222063753339
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,1536,1536,0.0042444442709287005
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,1536,1024,0.0038702223036024305
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,2048,256,0.01184177812602785
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,1536,2048,0.012432888978057437
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,1536,1536,0.012099555797047086
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,1536,512,0.0034862222770849862
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,1536,1024,0.01239999963177575
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,1536,256,0.0031786666562159858
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,1536,768,0.011707555916574268
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,1536,128,0.002573333266708586
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,1536,512,0.011428444749779172
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,1536,256,0.012065778175989786
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,1536,128,0.011120888921949597
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,1536,32,0.0025351111673646504
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,1536,64,0.01166044423977534
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,1024,65536,0.02607111136118571
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,1536,32,0.01070755554570092
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,1024,51200,0.0214008887608846
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,1024,65536,0.05749866697523329
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,1024,16384,0.012452444268597497
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,1024,51200,0.047154668304655284
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,1024,12288,0.011505777637163797
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,1024,16384,0.02293155590693156
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,1024,10240,0.010281778044170803
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,1024,12288,0.019430221782790292
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,1536,2560,0.012797333300113678
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,1536,768,0.0035582222044467926
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,1024,10240,0.017907554904619854
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,1024,8192,0.016226665841208566
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,1024,6144,0.00868800034125646
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,1024,5120,0.008008889026112026
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,1024,6144,0.015154666370815702
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,1536,64,0.002830222249031067
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,1024,4096,0.007609777980380588
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,1024,5120,0.014474666780895658
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,1024,3584,0.006966222491529252
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,1536,7168,0.009362666971153682
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,1024,4096,0.013767110804716745
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,1024,3072,0.006243555496136348
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,1024,2560,0.005597333527273602
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,1024,3584,0.013425778183672162
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,1024,2048,0.006798222247097228
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,1024,3072,0.013119999733236102
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,1024,1536,0.005564444594913059
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,1024,2048,0.012506666282812754
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,1024,1024,0.004881777697139316
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,1024,1536,0.012105777859687805
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,1024,768,0.003975999852021535
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,1024,1024,0.011724444727102915
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,1024,512,0.003687111039956411
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,1024,768,0.011776888536082374
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,1024,256,0.00314666661951277
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,1024,7168,0.009686222506894005
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,1024,128,0.002833777831660377
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,1024,512,0.011415111521879831
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,1024,64,0.003015111097031169
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,1024,256,0.011370666325092316
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,1024,7168,0.01605422298113505
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,1024,32,0.002826666666401757
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,1024,128,0.012072000238630505
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,768,65536,0.023748444186316595
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,1024,64,0.011361777782440186
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,768,51200,0.01924088928434584
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,768,16384,0.011034666664070554
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,1024,32,0.011078221930397881
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,768,12288,0.011021333436171213
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,768,65536,0.05576799975501167
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,768,51200,0.04571466644605001
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,768,10240,0.010074666804737514
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,768,16384,0.021295999487241108
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,768,12288,0.019175110591782462
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,768,10240,0.01722133325205909
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,1024,2560,0.012777778009573618
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,768,8192,0.016169778174824186
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,768,6144,0.008627555436558193
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,768,5120,0.0079297779334916
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,768,7168,0.015711999601787992
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,768,4096,0.007262222468852997
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,768,5120,0.01423822177780999
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,768,3584,0.007118222614129384
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,768,4096,0.01346933344999949
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,1024,8192,0.00905600024594201
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,768,3072,0.006240889016124938
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,768,2560,0.005728000154097875
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,768,3584,0.013348444468445249
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,768,3072,0.01311644415060679
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,768,2048,0.005209777918126848
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,768,1536,0.005195555587609609
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,768,2560,0.012795555922720166
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,768,1024,0.00423911131090588
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,768,2048,0.01237066669596566
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,768,1536,0.011758222348160215
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,768,768,0.0035297779573334586
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,768,512,0.00351200004418691
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,768,768,0.011715555356608497
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,768,256,0.003168888803985384
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,768,8192,0.008661333057615492
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,768,128,0.0029155556112527847
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,768,7168,0.009304000271691216
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,768,256,0.011377777490350934
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,768,64,0.0026071110947264563
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,768,32,0.00282222218811512
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,768,128,0.011735111474990845
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,512,65536,0.017857778403494094
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,768,64,0.011061333119869232
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,768,6144,0.015134221977657743
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,768,32,0.011377777490350934
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,512,51200,0.01612711118327247
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,512,16384,0.010348444183667501
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,512,12288,0.010064000056849586
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,512,65536,0.05513688921928406
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,512,10240,0.009340444372759925
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,512,51200,0.04487466812133789
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,512,16384,0.021249777740902368
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,512,8192,0.00829777783817715
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,512,7168,0.008980444735950893
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,512,10240,0.017856000198258292
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,512,8192,0.01620444489849938
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,512,6144,0.00832177781396442
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,512,5120,0.00796888851457172
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,512,7168,0.015473778049151102
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,512,4096,0.007314666277832455
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,512,6144,0.015186667442321777
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,512,3584,0.006738666858938005
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,512,5120,0.014803555276658801
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,768,1024,0.011540444360838996
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,512,3072,0.006600889066855113
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,512,4096,0.013432000246312885
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,512,2560,0.006274666637182236
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,512,2048,0.006148444281684027
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,512,3584,0.013403555585278405
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,768,512,0.011419555379284753
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,512,3072,0.013078221844302284
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,512,1536,0.00453333349691497
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,512,2560,0.01275022245115704
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,512,1024,0.0038684445122877755
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,512,768,0.003495111233658261
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,512,2048,0.012753778033786349
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,512,1536,0.012098666694429187
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,512,512,0.003208000005947219
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,512,256,0.0028355556229750314
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,512,1024,0.011360888679822287
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,512,128,0.0028293333533737394
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,512,768,0.011757333245542316
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,512,64,0.0028115556471877625
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,512,512,0.011063999599880643
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,512,256,0.011769777370823754
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,512,32,0.0028071111689011254
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,512,128,0.01054044481780794
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,256,65536,0.01717511150572035
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,512,64,0.01108977778090371
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,256,51200,0.014902222487661572
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,256,16384,0.00941066692272822
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,512,32,0.01036622209681405
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,256,12288,0.00795377790927887
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,512,12288,0.018956444329685636
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,256,65536,0.05194488830036587
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,256,10240,0.007695111135641734
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,256,51200,0.04281511240535312
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,256,8192,0.006918222126033571
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,256,16384,0.021391999390390184
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,256,7168,0.006616888774765863
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,256,6144,0.007295110987292395
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,256,12288,0.018547554810841877
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,256,5120,0.006638222270541721
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,256,10240,0.017862222260899015
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,256,4096,0.00627377794848548
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,256,8192,0.016472889317406546
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,256,7168,0.015511110424995422
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,256,3584,0.006261333409282897
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,256,6144,0.015160888433456421
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,256,3072,0.005621333503060871
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,256,2560,0.005774222314357758
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,256,4096,0.014116444521480136
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,256,2048,0.005562666803598404
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,256,3584,0.013748444616794586
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,256,1536,0.004409777621428172
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,256,1024,0.0038213332494099936
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,256,2560,0.012800888882742988
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,256,2048,0.012443555725945367
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,256,768,0.003564444267087512
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,256,512,0.0031679999083280563
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,256,1536,0.01204355557759603
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,256,256,0.003084444544381566
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,256,1024,0.012373333175977072
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,256,128,0.002509333400262727
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,256,768,0.011383111278216044
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,256,64,0.0025111111915773815
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,256,512,0.011399110986126794
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,256,32,0.0028204443968004654
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,256,256,0.011024889018800525
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,128,65536,0.0147724449634552
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,256,128,0.011720000041855706
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,128,51200,0.012379555238617791
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,256,64,0.01071111112833023
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,256,32,0.011417778001891242
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,128,16384,0.008012444608741337
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,128,12288,0.007442666424645319
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,128,65536,0.05063377817471822
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,128,51200,0.042103111743927
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,128,16384,0.020644444558355544
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,128,8192,0.006588444527652528
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,128,12288,0.01853511068556044
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,128,7168,0.006586666736337874
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,128,6144,0.006235555642180973
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,128,10240,0.017281777328915067
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,128,5120,0.006035555568006303
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,128,8192,0.015968888998031616
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,128,7168,0.015847111741701763
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,128,4096,0.00554933316177792
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,128,6144,0.01512888901763492
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,128,3584,0.0059075554211934405
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,128,5120,0.014483556151390076
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,128,4096,0.013520888984203339
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,128,2560,0.005903111149867375
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,128,3584,0.013481777575280933
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,256,5120,0.014452444182501899
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,128,2048,0.005719999886221356
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,128,1536,0.0042364444169733255
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,256,3072,0.013453333742088742
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,128,2560,0.01277955538696713
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,128,1024,0.0038720000949170855
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,128,2048,0.012098666694429187
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,128,768,0.0035457776652442086
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,128,1536,0.012433778080675336
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,128,1024,0.011648889217111798
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,128,768,0.011393778026103973
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,128,256,0.0028444443725877335
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,128,128,0.002543111021320025
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,128,512,0.011572444604502784
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,128,64,0.002528000002106031
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,128,256,0.01071111112833023
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,128,128,0.01073155552148819
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,128,32,0.002514666567246119
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,128,10240,0.007084444165229797
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,128,64,0.011408000356621213
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,64,65536,0.011230222052998014
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,128,32,0.01035377797153261
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,64,51200,0.01038044442733129
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,64,16384,0.0069297779765393995
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,64,65536,0.05095377895567152
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,64,12288,0.006993778049945831
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,64,51200,0.04145333170890808
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,64,10240,0.006616000086069107
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,64,16384,0.021262221866183813
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,128,3072,0.005897777775923411
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,64,8192,0.00692622239391009
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,64,12288,0.018924444913864136
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,64,7168,0.006589333216349284
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,64,6144,0.006275555739800136
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,64,10240,0.01720888912677765
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,64,5120,0.005600888695981767
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,64,8192,0.015819556183285184
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,64,7168,0.015817777978049386
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,64,4096,0.005256888767083486
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,64,6144,0.01513066722287072
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,64,5120,0.014452444182501899
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,64,4096,0.01388177772363027
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,64,3072,0.005233777893914117
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,64,2560,0.00574933323595259
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,64,3584,0.013576889203654395
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,64,2048,0.005903111149867375
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,64,3072,0.013421333498424955
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,64,1536,0.004512000001139111
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,64,2560,0.01272266689274046
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,64,1024,0.0038177776667806837
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,64,2048,0.012753778033786349
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,64,768,0.0034862222770849862
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,64,1536,0.01238666640387641
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,64,512,0.003169777699642711
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,64,1024,0.011698666546079846
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,64,256,0.00281866660548581
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,64,768,0.011809777882364062
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,64,128,0.0028213332924577924
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,64,512,0.011380444798204633
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,64,64,0.0024764444679021835
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,64,256,0.01071911139620675
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,64,32,0.002518222149875429
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,64,128,0.011415111521879831
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,32,65536,0.011384888655609555
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,64,64,0.011085333095656501
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,64,32,0.01033688916100396
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,32,51200,0.010382222632567087
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,32,16384,0.006986666884687211
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,128,3072,0.013071111506885953
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,32,65536,0.05064444409476387
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,32,12288,0.006924444602595435
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,32,10240,0.006259555617968242
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,64,3584,0.005548444473081165
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,32,16384,0.021264889174037512
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,32,8192,0.005940444353553984
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,32,7168,0.0059368887709246735
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,32,12288,0.0188737776544359
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,32,10240,0.017342221405771043
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,32,8192,0.016224000189039443
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,32,5120,0.005886222339338726
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,32,7168,0.015463999576038785
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,32,4096,0.005218666460778978
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,32,6144,0.014771555860837301
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,32,3584,0.005573333137565189
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,32,5120,0.014493332968817817
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,32,3072,0.005567111074924469
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,32,4096,0.013409777647919126
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,32,2560,0.005621333503060871
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,32,3584,0.013431111143694984
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,32,2048,0.005225777626037598
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,32,3072,0.013416888813177744
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,32,1536,0.004197333421972063
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,32,2560,0.012452444268597497
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,32,1024,0.0038622220357259116
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,32,2048,0.0122417774465349
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,32,768,0.003516444315512975
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,32,1536,0.012101333174440594
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,32,512,0.0031475555151700974
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,32,1024,0.011042666931947073
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,32,256,0.002814222127199173
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,32,768,0.011378666592968835
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,32,512,0.011426666544543372
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,32,128,0.0028115556471877625
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,32,51200,0.041402667760849
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,32,256,0.010694222317801582
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,32,32,0.002464888824356927
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,32,128,0.011438222395049201
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,32,64,0.010886222124099731
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,14,32,32,0.010415111151006486
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,65536,16384,0.3234773212009006
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,65536,51200,0.5005004670884874
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,65536,16384,0.17192533281114367
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,65536,12288,0.22738578584459093
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,65536,51200,0.9750933117336698
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,32,64,0.002475555572244856
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,65536,10240,0.18906311194101968
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,128,512,0.003175111073586676
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,65536,12288,0.13072178098890516
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,14,32,6144,0.0062773335311147906
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,65536,10240,0.11146488454606797
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,65536,8192,0.13613333966996935
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,65536,7168,0.13367911179860434
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,65536,6144,0.11524444156222874
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,65536,5120,0.09727199872334798
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,65536,4096,0.08054844538370769
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,65536,6144,0.09097955624262492
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,65536,5120,0.08302666743596394
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,65536,3584,0.06906044483184814
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,65536,4096,0.06745066907670763
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,65536,3072,0.06032622522777981
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,65536,2560,0.05111555589569939
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,65536,2048,0.0417208903365665
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,65536,2560,0.045026666588253446
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,65536,3072,0.057935112052493624
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,65536,3584,0.06032355626424154
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,65536,1536,0.03258666727277968
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,65536,1024,0.02362222141689724
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,65536,768,0.018783110711309645
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,65536,1536,0.03423022230466207
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,65536,2048,0.043495999442206494
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,65536,1024,0.02643999954064687
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,65536,512,0.013397333522637686
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,65536,256,0.008199111455016667
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,65536,768,0.02093422247303857
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,65536,128,0.006548444430033366
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,65536,64,0.005894222193294101
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,65536,512,0.01956355571746826
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,65536,256,0.016640888320075143
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,65536,32,0.005886222339338726
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,65536,128,0.014136888914638095
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,65536,64,0.01517511076397366
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,65536,32,0.016549333930015564
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,65536,8192,0.15546400017208523
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,51200,16384,0.2759564452701145
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,51200,65536,0.5265884399414062
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,51200,51200,0.4015333387586806
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,51200,12288,0.2100151114993625
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,51200,16384,0.13993688424428305
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,51200,51200,0.8238551351759168
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,51200,12288,0.1068648894627889
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,51200,8192,0.1381502283944024
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,51200,10240,0.1746515565448337
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,51200,10240,0.09179555707507664
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,51200,8192,0.09388089179992676
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,51200,6144,0.10558399889204238
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,65536,7168,0.10748800304200913
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,51200,5120,0.09037422471576267
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,51200,7168,0.08616177903281318
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,51200,7168,0.12071555190616184
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,51200,6144,0.08161155382792155
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,51200,4096,0.07283377647399902
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,51200,3584,0.06307555569542779
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,51200,5120,0.06629955768585205
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,51200,2560,0.04676444331804911
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,51200,3072,0.055952886740366616
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,51200,3584,0.050768888658947416
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,51200,3072,0.049491554498672485
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,51200,4096,0.05650044149822659
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,51200,2048,0.037979556454552546
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,51200,1024,0.02141422198878394
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,51200,768,0.016223111086421542
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,51200,1536,0.029334220621320937
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,51200,512,0.01142133358452055
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,51200,1024,0.02383822202682495
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,51200,2560,0.03812088900142246
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,51200,768,0.019088000059127808
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,51200,256,0.007322666545708974
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,51200,65536,1.0871884028116863
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,51200,64,0.00351555562681622
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,51200,512,0.01778133379088508
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,51200,256,0.014576888746685453
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,51200,32,0.003559111307064692
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,51200,128,0.013922666509946188
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,51200,32,0.01479466590616438
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,16384,65536,0.3207777871025933
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,51200,64,0.013891556196742587
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,16384,51200,0.2494435575273302
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,16384,65536,0.18780710962083605
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,16384,16384,0.09123822053273518
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,16384,12288,0.07077866792678833
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,16384,51200,0.1422613329357571
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,16384,10240,0.05312711000442505
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,51200,1536,0.029422223567962646
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,16384,12288,0.0452497767077552
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,16384,16384,0.05634399917390612
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,16384,8192,0.04406933320893181
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,51200,2048,0.03764977720048692
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,16384,10240,0.04032355546951294
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,16384,6144,0.03293955657217238
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,16384,8192,0.04287022352218628
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,16384,5120,0.029048889875411987
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,16384,7168,0.03866399990187751
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,51200,128,0.004202666795916027
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,16384,6144,0.036526223023732506
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,16384,3584,0.02160533269246419
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,16384,4096,0.024102222588327196
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,16384,3072,0.018567111757066514
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,16384,5120,0.03635288940535651
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,16384,2560,0.01612977849112617
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,16384,4096,0.02684266699684991
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,16384,3584,0.025133333272404138
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,16384,1536,0.01093777765830358
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,16384,3072,0.024295111497243244
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,16384,2560,0.02128622266981337
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,16384,2048,0.020000000794728596
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,16384,768,0.006892444358931647
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,16384,1536,0.018156444032986958
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,16384,512,0.00490133340160052
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,16384,1024,0.015810666812790763
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,16384,256,0.0032319999817344877
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,16384,768,0.013934221532609729
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,16384,128,0.0028826666788922418
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,16384,512,0.01312444441848331
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,16384,64,0.002793777734041214
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,16384,256,0.012402666939629449
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,16384,128,0.011424000064531961
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,16384,32,0.0028284444577164124
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,16384,64,0.011537777880827585
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,16384,32,0.01239822225438224
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,16384,7168,0.03851111067665948
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,12288,65536,0.25284889009263783
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,12288,65536,0.15876532925499812
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,12288,51200,0.20019822650485566
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,12288,16384,0.06710311439302233
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,12288,12288,0.05236355463663737
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,12288,16384,0.05014488763279385
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,16384,2048,0.013316444224781461
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,12288,10240,0.04486933350563049
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,12288,8192,0.037535998556349016
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,16384,1024,0.008623999853928884
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,12288,10240,0.03629422187805176
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,12288,7168,0.03298844562636481
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,12288,6144,0.029115554359224107
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,12288,8192,0.03837066557672288
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,12288,5120,0.02567911148071289
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,12288,7168,0.03502488798565335
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,12288,4096,0.02058577703105079
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,12288,3584,0.017820444371965196
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,12288,6144,0.03375644485155741
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,12288,5120,0.027886221806208294
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,12288,3072,0.015697777271270752
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,12288,4096,0.025573333104451496
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,12288,2560,0.013222222526868185
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,12288,3584,0.023225777679019507
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,12288,2048,0.011436444189813403
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,12288,3072,0.022851554883850947
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,12288,1536,0.00962933318482505
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,12288,2560,0.019333332777023315
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,12288,1024,0.007875555919276344
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,12288,2048,0.01919644408755832
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,12288,1536,0.016912000046836007
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,12288,512,0.004514666481150521
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,12288,1024,0.014436443646748861
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,12288,256,0.004014222158326043
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,12288,512,0.013068444199032254
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,12288,128,0.003192000091075897
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,12288,51200,0.12285689512888591
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,12288,256,0.011732444167137146
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,12288,64,0.0028355556229750314
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,12288,32,0.0028773333049482773
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,12288,128,0.011350221931934357
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,12288,64,0.011697777443461947
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,12288,12288,0.04060711132155524
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,12288,32,0.011716444459226398
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,10240,65536,0.2184657785627577
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,10240,51200,0.1720284488466051
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,10240,65536,0.15056444538964167
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,10240,16384,0.0600151088502672
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,10240,51200,0.11776799625820583
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,10240,12288,0.046880000167422824
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,10240,10240,0.03836977812978957
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,10240,8192,0.03262933426433139
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,10240,16384,0.04817600051561991
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,10240,10240,0.035409778356552124
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,10240,7168,0.02907199992073907
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,10240,12288,0.03901066713862949
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,10240,8192,0.03281599945492215
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,10240,6144,0.026016889346970454
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,10240,5120,0.022908444205919903
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,12288,768,0.006232888748248418
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,10240,4096,0.018539556198649935
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,10240,7168,0.030989332331551447
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,10240,3584,0.015790222419632804
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,10240,3072,0.014383999837769402
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,10240,6144,0.026345777842733595
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,10240,2560,0.012375999655988483
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,10240,5120,0.02432800001568264
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,10240,4096,0.02241155505180359
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,12288,768,0.013413333230548434
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,10240,2048,0.011001778145631155
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,10240,3584,0.021319111188252766
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,10240,1536,0.009175111022260454
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,10240,1024,0.007655999726719326
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,10240,3072,0.02056711084312863
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,10240,512,0.004543111142185
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,10240,2048,0.017510222064124215
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,10240,1024,0.014115555418862237
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,10240,256,0.0037457777394188773
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,10240,768,0.013764444324705334
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,10240,128,0.003176888864901331
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,10240,512,0.013049778011110095
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,10240,64,0.0028640000770489373
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,10240,256,0.011426666544543372
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,10240,32,0.0028275555620590844
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,10240,128,0.012048888537618848
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,10240,64,0.012440000143316058
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,10240,32,0.011711111499203576
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,8192,65536,0.17400977346632215
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,8192,51200,0.13086667325761583
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,8192,65536,0.10379644234975179
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,8192,16384,0.0458222230275472
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,8192,51200,0.08001955350240071
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,8192,12288,0.032660444577534996
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,8192,16384,0.03713422351413303
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,8192,10240,0.027455111344655354
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,8192,8192,0.02476799984773
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,8192,12288,0.030116445488399927
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,8192,7168,0.021693333983421326
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,8192,10240,0.027052443888452318
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,10240,768,0.00589155571328269
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,8192,6144,0.01897333396805657
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,8192,8192,0.027058665951093037
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,8192,5120,0.016694222887357075
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,10240,1536,0.016191111670600045
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,8192,7168,0.02565066681967841
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,8192,3584,0.012491555677519904
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,8192,4096,0.014774221513006421
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,8192,6144,0.023524444964196947
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,8192,3072,0.011409777734014722
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,8192,2560,0.009853333234786987
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,8192,2048,0.008574222524960836
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,8192,3584,0.019282667173279654
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,8192,3072,0.01794488893614875
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,8192,1536,0.007344889144102733
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,8192,2560,0.017183999220530193
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,8192,1024,0.00556355549229516
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,8192,2048,0.015783111254374187
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,8192,768,0.004416000097990036
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,8192,512,0.0038328886859946777
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,8192,1536,0.014094221923086377
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,8192,256,0.003499555504984326
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,8192,768,0.012780444489585029
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,8192,1024,0.013071999781661563
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,8192,128,0.003141333245568805
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,8192,64,0.002834666727317704
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,8192,256,0.011726222104496427
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,8192,32,0.0028124445428450904
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,8192,128,0.011379555695586734
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,8192,64,0.011716444459226398
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,8192,32,0.011387555963463254
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,7168,65536,0.15006221665276423
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,7168,51200,0.1169511079788208
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,7168,65536,0.09460800223880345
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,7168,16384,0.04197600152757433
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,10240,2560,0.018251554833518136
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,7168,51200,0.07346577776802911
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,7168,12288,0.03325066632694668
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,7168,16384,0.03417333298259311
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,7168,10240,0.028295109669367473
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,7168,8192,0.021743999587164983
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,8192,5120,0.020755555894639757
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,8192,4096,0.01925155520439148
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,7168,6144,0.017882666654056974
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,7168,10240,0.024898666474554274
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,7168,8192,0.026047110557556152
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,7168,5120,0.015784889459609985
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,7168,4096,0.013732444081041547
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,7168,6144,0.022435555855433147
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,7168,3584,0.012093333734406365
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,7168,5120,0.020541333489947848
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,7168,4096,0.01955200069480472
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,7168,3072,0.010949333508809408
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,8192,512,0.012444444828563266
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,7168,2560,0.009477333062224919
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,7168,3584,0.018576888574494254
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,7168,2048,0.008282666405042013
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,7168,1536,0.007284444239404466
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,7168,3072,0.01777777738041348
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,7168,1024,0.00555377784702513
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,7168,2560,0.016594666573736403
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,7168,2048,0.014781332678265043
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,7168,768,0.004193777839342753
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,7168,512,0.0036275556517971885
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,7168,1536,0.014154665999942355
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,7168,256,0.0032711111836963226
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,7168,1024,0.012757333616415659
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,7168,128,0.0031644445326593188
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,7168,768,0.012710221939616732
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,7168,512,0.012423999607563019
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,7168,256,0.011747555600272285
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,7168,32,0.0028444443725877335
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,7168,128,0.011026666396194033
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,7168,64,0.011714666253990598
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,7168,32,0.011780444118711682
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,6144,65536,0.12303377522362603
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,7168,7168,0.020548444655206468
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,6144,65536,0.08803733189900716
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,6144,16384,0.03587111168437534
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,7168,7168,0.02440799938307868
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,6144,51200,0.06726400057474773
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,6144,16384,0.031890667147106595
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,6144,10240,0.02477688921822442
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,6144,12288,0.025980444418059453
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,6144,8192,0.02158755560715993
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,6144,10240,0.023020444644822016
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,6144,7168,0.019253333409627277
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,6144,8192,0.025568000144428674
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,6144,6144,0.016913778252071805
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,6144,7168,0.02382044494152069
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,7168,64,0.0028159999185138275
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,6144,6144,0.021934222843911912
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,6144,5120,0.015102222561836243
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,6144,4096,0.011507555842399597
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,6144,3584,0.010370666782061258
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,6144,5120,0.019314666589101154
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,6144,4096,0.018230222993426852
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,6144,3072,0.010013333625263637
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,6144,2560,0.008999110923873054
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,6144,3584,0.018427555759747822
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,7168,12288,0.02812888887193468
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,6144,2048,0.007993777592976889
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,6144,3072,0.01739377776781718
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,6144,1536,0.0069226668112807805
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,6144,51200,0.09732800059848362
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,6144,1024,0.004473777694834603
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,6144,2560,0.015504888362354703
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,6144,768,0.0038355555799272326
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,6144,512,0.003555555724435382
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,6144,2048,0.01428533262676663
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,6144,1536,0.013795555465751223
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,6144,256,0.003216000066863166
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,6144,128,0.002855111120475663
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,6144,768,0.012442666623327466
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,6144,1024,0.01273155543539259
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,6144,64,0.0028026666906144884
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,6144,32,0.0028133332315418455
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,6144,512,0.012105777859687805
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,6144,256,0.011400000088744693
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,6144,128,0.01072799993885888
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,6144,64,0.011071110765139261
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,6144,32,0.011417778001891242
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,5120,51200,0.08581778075959946
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,5120,16384,0.032215111785464816
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,5120,65536,0.07825689183341132
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,5120,12288,0.026030222574869793
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,5120,10240,0.022224000758594934
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,5120,16384,0.029782222376929388
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,5120,8192,0.019839111301634047
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,5120,12288,0.023690667417314317
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,5120,10240,0.02203111184967889
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,5120,7168,0.017147555947303772
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,5120,6144,0.015544000599119397
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,5120,8192,0.02410488824049632
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,5120,5120,0.01382844481203291
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,5120,7168,0.02269422180122799
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,5120,4096,0.01205244412024816
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,5120,3584,0.010637332995732626
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,5120,5120,0.019296000401178997
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,5120,4096,0.018184888694021437
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,5120,3072,0.009347555538018545
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,5120,2560,0.008370666868156856
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,5120,3584,0.01754488878779941
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,5120,2048,0.007600000335110559
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,5120,3072,0.016195555528004963
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,5120,1536,0.00591822216908137
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,5120,2048,0.014446222119861178
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,6144,12288,0.02923999892340766
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,5120,1024,0.0042071110672420925
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,5120,768,0.0042053332759274375
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,5120,1536,0.013595555391576556
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,5120,512,0.003539555602603488
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,5120,1024,0.012434666355450949
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,5120,256,0.0032337777730491427
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,5120,768,0.012768000364303589
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,5120,65536,0.10787644651201035
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,5120,512,0.01180266671710544
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,5120,64,0.002520888836847411
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,5120,256,0.011056889262464313
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,5120,51200,0.06146133608288235
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,5120,32,0.0028737777223189673
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,5120,128,0.011415111521879831
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,5120,64,0.011017777853541903
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,4096,65536,0.0860897766219245
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,5120,32,0.011365333365069495
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,4096,16384,0.02750844425625271
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,4096,65536,0.07174933618969388
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,5120,6144,0.020865778128306072
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,4096,12288,0.021497777766651575
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,4096,51200,0.05745066536797417
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,4096,16384,0.026312889324294195
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,4096,10240,0.01920977731545766
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,4096,8192,0.016512889001104567
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,4096,12288,0.022184888521830242
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,4096,7168,0.01386044422785441
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,4096,10240,0.02068622244728936
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,4096,8192,0.021718222233984206
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,5120,2560,0.014825777875052558
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,4096,5120,0.011000889043013254
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,4096,7168,0.021299555897712708
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,4096,4096,0.01036888857682546
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,4096,6144,0.01993777851263682
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,4096,3584,0.008962666822804345
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,4096,5120,0.017893332574102614
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,4096,4096,0.017210667332013447
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,4096,3072,0.008263111114501953
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,4096,3584,0.016170667277442086
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,4096,2560,0.007291555404663086
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,4096,2048,0.005872888697518243
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,5120,128,0.0028773333049482773
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,4096,1536,0.004564444637960858
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,4096,3072,0.014831999937693277
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,4096,1024,0.0038497779104444715
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,4096,2560,0.014150222142537435
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,4096,2048,0.013567110730542077
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,4096,768,0.003559999995761447
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,4096,512,0.003527111063400904
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,4096,1536,0.013436444103717804
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,4096,256,0.0028595555987623003
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,4096,1024,0.012090666426552666
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,4096,51200,0.0679911110136244
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,4096,768,0.012423999607563019
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,4096,64,0.002520888836847411
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,4096,512,0.011713777979214987
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,4096,32,0.002867555452717675
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,4096,256,0.011502222054534487
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,4096,128,0.011384000380833944
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,3584,65536,0.07817333274417453
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,4096,32,0.010749333434634738
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,3584,51200,0.060681780179341636
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,3584,16384,0.023774221539497375
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,3584,65536,0.06867911418279012
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,4096,6144,0.01236533373594284
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,3584,12288,0.01905955539809333
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,3584,51200,0.05538488758934868
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,3584,10240,0.01684799955950843
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,3584,8192,0.014589332871966891
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,3584,16384,0.02532977859179179
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,3584,12288,0.021627555290857952
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,3584,7168,0.013769778112570444
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,3584,6144,0.01201333353916804
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,3584,8192,0.02187999917401208
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,3584,7168,0.020263110597928364
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,3584,5120,0.010415111151006486
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,3584,4096,0.00980888886584176
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,3584,6144,0.01945244438118405
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,3584,3584,0.008637333081828224
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,3584,5120,0.017849778135617573
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,3584,3072,0.007975111405054728
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,3584,4096,0.016179554992251925
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,3584,2560,0.006950221955776215
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,3584,3584,0.015253333581818474
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,3584,2048,0.005696889013051987
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,3584,3072,0.014787554740905762
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,4096,128,0.002834666727317704
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,3584,1536,0.004512888689835866
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,3584,2560,0.013821333646774292
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,3584,1024,0.004054222255945206
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,3584,768,0.0035146665241983202
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,3584,2048,0.014137778017255994
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,3584,512,0.0033537778589460584
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,3584,1536,0.01277511070171992
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,3584,1024,0.012059555285506778
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,4096,64,0.011762667033407422
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,3584,256,0.003212444484233856
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,3584,768,0.0123857781291008
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,3584,64,0.0028293333533737394
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,3584,512,0.01237511138121287
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,3584,32,0.0028515555378463534
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,3584,128,0.011029333704047732
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,3584,64,0.011356444822417365
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,3072,65536,0.06345422400368585
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,3584,32,0.011735999749766456
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,3072,51200,0.05067822337150574
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,3072,16384,0.0206675562593672
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,3584,10240,0.02039377722475264
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,3072,65536,0.06687733199861315
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,3072,12288,0.017200888858901132
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,3072,51200,0.05404000149832832
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,3072,10240,0.01696711116366916
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,3072,8192,0.014997333288192749
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,3072,16384,0.024728889266649883
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,3072,12288,0.02125955621401469
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,3072,7168,0.012588444683286877
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,3072,10240,0.020202666521072388
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,3072,6144,0.011223999990357293
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,3072,5120,0.010042666561073726
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,3072,8192,0.02051111062367757
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,3072,7168,0.019564444820086162
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,3072,4096,0.009016888837019602
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,3072,3584,0.00829777783817715
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,3072,6144,0.01789155602455139
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,3072,3072,0.007627555893527136
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,3072,5120,0.016319110989570618
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,3072,2560,0.006288888967699475
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,3072,4096,0.015468445089128284
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,3072,2048,0.005535999933878581
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,3072,3584,0.014549333188268872
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,3072,3072,0.014136888914638095
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,3072,2560,0.013763555222087435
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,3072,2048,0.013413333230548434
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,3584,128,0.0028604444944196274
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,3072,1024,0.003834666477309333
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,3072,768,0.003859555555714501
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,3584,256,0.011007111105653973
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,3072,1536,0.01277599980433782
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,3072,512,0.0031600000543726813
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,3072,1024,0.012082666986518435
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,3072,768,0.012077333198653327
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,3072,512,0.011728000309732227
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,3072,256,0.011362666885058085
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,3072,64,0.00263288886182838
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,3072,128,0.011369778050316704
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,3072,32,0.002842666581273079
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,3072,64,0.011765333513418833
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,3072,32,0.010737777584128909
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,2560,65536,0.06390221913655598
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,2560,51200,0.0452497767077552
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,3072,1536,0.004567999806669024
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,2560,51200,0.05213333169619242
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,2560,16384,0.018775110443433125
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,2560,12288,0.015629332926538255
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,3072,256,0.0028479999552170434
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,2560,16384,0.024280889166726008
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,2560,10240,0.0144213338692983
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,2560,12288,0.021345777644051447
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,2560,8192,0.012895111408498553
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,2560,7168,0.011912888950771756
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,2560,10240,0.01957155598534478
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,2560,8192,0.019903999235894945
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,2560,6144,0.011113777756690979
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,2560,5120,0.010223999619483948
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,2560,7168,0.018575110369258456
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,2560,4096,0.008708444734414419
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,2560,6144,0.017143110434214275
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,2560,3584,0.00794488853878445
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,2560,5120,0.01512888901763492
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,2560,65536,0.057526224189334445
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,2560,3072,0.006978666616810693
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,2560,4096,0.014674666855070325
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,2560,2560,0.005599110904667113
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,2560,2048,0.005249777601824866
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,2560,3584,0.01445777714252472
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,2560,1536,0.004514666481150521
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,2560,3072,0.01406133340464698
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,2560,1024,0.0038888889054457345
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,2560,2560,0.013450666434235044
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,2560,768,0.0038319999972979226
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,2560,512,0.0032248888164758682
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,2560,1536,0.01275288893116845
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,2560,256,0.0028515555378463534
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,2560,512,0.011422221859296164
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,2560,128,0.00282577777074443
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,2560,256,0.011448889142937131
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,2560,64,0.0025128889828920364
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,2560,128,0.011067555182509951
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,2560,32,0.0025351111673646504
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,3072,128,0.0028088889602157804
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,2560,64,0.011774222056070963
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,2048,65536,0.051197333468331226
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,2560,32,0.010796444283591377
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,2048,51200,0.037257777320014104
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,2048,65536,0.061604446834988065
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,2048,51200,0.05044000016318428
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,2048,12288,0.014670222997665405
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,2048,16384,0.02402577797571818
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,2048,10240,0.013297778036859302
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,2048,12288,0.020818667279349435
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,2048,8192,0.01220266686545478
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,2048,10240,0.019527999891175162
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,2560,2048,0.013099555340078143
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,2048,7168,0.01110311100880305
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,2048,6144,0.010694222317801582
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,2048,8192,0.019487111104859244
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,2560,1024,0.01204622205760744
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,2560,768,0.012049777640236748
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,2048,5120,0.009648888475365108
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,2048,4096,0.00814577771557702
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,2048,3584,0.007251555720965068
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,2048,7168,0.016943999462657504
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,2048,3072,0.006257777826653586
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,2048,6144,0.015836444165971544
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,2048,5120,0.014724445011880664
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,2048,2560,0.005919999960396025
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,2048,4096,0.014381332529915703
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,2048,2048,0.0052426668504873914
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,2048,3584,0.014104889498816596
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,2048,1536,0.004390222330888112
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,2048,3072,0.013577777478430005
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,2048,1024,0.0038764443662431505
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,2048,2560,0.013408888545301227
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,2048,768,0.0035866668654812705
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,2048,2048,0.012784889174832238
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,2048,512,0.003198222153716617
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,2048,1536,0.012425777812798819
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,2048,256,0.0028568889117903183
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,2048,1024,0.01238222254647149
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,2048,128,0.0028826666788922418
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,2048,768,0.012427555190192329
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,2048,512,0.011703111231327057
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,2048,64,0.0028417776856157514
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,2048,256,0.011003555523024665
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,2048,32,0.0028124445428450904
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,2048,16384,0.0165955556763543
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,2048,128,0.011507555842399597
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,1536,65536,0.03631555702951219
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,1536,51200,0.029457777738571167
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,2048,32,0.010752889017264048
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,1536,16384,0.013785777820481194
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,1536,12288,0.012894222305880653
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,1536,51200,0.04911199874348111
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,1536,10240,0.011377777490350934
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,1536,16384,0.023123555713229712
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,1536,8192,0.010071111222108206
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,1536,12288,0.02060622142420875
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,1536,7168,0.009657777845859528
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,1536,10240,0.018765333626005385
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,1536,6144,0.010029333333174387
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,1536,8192,0.016540444559521146
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,1536,5120,0.008650666309727563
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,1536,7168,0.016143111719025504
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,1536,4096,0.007638221813572778
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,1536,6144,0.015790222419632804
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,1536,3584,0.006976889239417181
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,1536,5120,0.014472888575659858
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,1536,3072,0.006329777754015393
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,1536,4096,0.014113777213626437
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,1536,2560,0.00562755556570159
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,1536,3584,0.014128888646761576
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,1536,2048,0.004910222358173794
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,1536,3072,0.01311822235584259
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,1536,1536,0.004567999806669024
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,1536,2560,0.013437333206335703
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,1536,1024,0.003859555555714501
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,1536,2048,0.012784889174832238
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,1536,768,0.003641777982314428
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,2048,64,0.010687111152542962
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,1536,1024,0.012425777812798819
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,1536,512,0.0032239999208185407
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,1536,768,0.012431110772821637
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,1536,65536,0.05989333656099108
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,1536,128,0.0028862222615215513
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,1536,512,0.011730666789743634
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,1536,64,0.0024871110088295406
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,1536,256,0.011511999699804517
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,1536,32,0.00254133323000537
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,1536,128,0.011020444333553314
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,1024,65536,0.025915554828113977
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,1536,64,0.011361777782440186
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,1024,51200,0.021351999706692163
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,1536,32,0.011396444506115384
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,1024,16384,0.012050666742854647
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,1024,12288,0.011690666278203329
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,1024,65536,0.05702755848566691
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,1024,51200,0.04600711001290215
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,1024,10240,0.010029333333174387
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,1024,16384,0.02275111112329695
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,1024,8192,0.009300444689061906
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,1024,7168,0.009378666679064432
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,1024,10240,0.017862222260899015
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,1024,6144,0.009015999734401703
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,1024,7168,0.015801777442296345
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,1024,5120,0.007676444119877285
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,1024,6144,0.01536799967288971
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,1024,4096,0.007596444752481248
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,1024,5120,0.014602666099866232
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,1024,3584,0.006909333169460297
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,1024,4096,0.014045332868893942
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,1536,256,0.002963555562827322
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,1024,3072,0.006302222195598815
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,1024,2560,0.005566222386227713
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,1024,3584,0.013805333111021252
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,1024,2048,0.006607111129495833
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,1024,3072,0.013069333301650153
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,1024,1536,0.005897777775923411
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,1024,2560,0.013419555293189155
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,1024,1024,0.004888888862397936
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,1024,2048,0.012664889295895895
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,1024,768,0.004219555606444676
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,1024,1536,0.01238933371173011
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,1024,512,0.0035537779331207275
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,1024,1024,0.012101333174440594
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,1024,256,0.003177777760558658
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,1024,768,0.012098666694429187
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,1024,128,0.00286666676402092
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,1024,512,0.011555555793974133
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,1024,12288,0.01888177792231242
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,1024,64,0.0028239999794297745
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,1024,256,0.011658666862381829
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,1024,32,0.0028328889360030494
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,1024,8192,0.016524444023768108
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,768,65536,0.023544000254737005
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,768,51200,0.01923733287387424
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,1024,32,0.011077333655622272
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,768,16384,0.011307555768224927
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,768,65536,0.056031107902526855
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,1536,1536,0.012440889245933957
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,768,51200,0.045500444041358105
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,768,16384,0.021292444732454088
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,768,10240,0.009896888501114314
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,768,12288,0.01904622217019399
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,768,8192,0.008338666624493068
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,768,10240,0.017806222041447956
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,768,7168,0.009157333109113906
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,768,8192,0.016191111670600045
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,768,6144,0.008648888932334052
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,768,7168,0.015843555331230164
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,768,5120,0.007956444389290279
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,768,6144,0.015171556009186639
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,768,4096,0.007254222200976477
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,768,5120,0.014789332946141561
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,768,3584,0.0069360000391801195
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,768,4096,0.013798221945762634
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,768,3072,0.006230222268237009
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,1024,128,0.01090311093462838
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,768,2560,0.005581333405441708
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,768,3584,0.014094221923086377
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,1024,64,0.011064888702498542
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,768,2048,0.005220444252093633
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,768,1536,0.005033777819739448
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,768,2560,0.013060444758998023
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,768,12288,0.01108000013563368
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,768,1536,0.012401777837011548
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,768,768,0.003559999995761447
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,768,512,0.0035146665241983202
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,768,1024,0.012234666281276278
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,768,256,0.002967111145456632
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,768,768,0.012048888537618848
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,768,128,0.0028204443968004654
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,768,512,0.01204711116022534
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,768,64,0.002502222235004107
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,768,256,0.011384888655609555
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,768,32,0.0025128889828920364
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,768,128,0.011028444601429833
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,768,64,0.01143022212717268
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,768,32,0.01146311147345437
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,512,51200,0.015995555453830294
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,512,65536,0.05443911088837517
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,512,16384,0.010326222413116032
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,512,51200,0.045428444941838585
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,512,12288,0.010253333383136326
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,512,16384,0.021336888273557026
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,768,3072,0.013054221868515015
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,512,12288,0.01923466722170512
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,512,8192,0.007978666987684038
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,768,2048,0.012392000191741519
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,512,10240,0.017455110947291057
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,512,7168,0.008672888908121321
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,512,6144,0.008293333152929941
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,512,8192,0.016567111015319824
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,512,7168,0.015791111522250705
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,512,6144,0.01499288943078783
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,512,4096,0.0070426662762959795
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,512,5120,0.014114666316244336
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,512,3584,0.006963555183675554
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,512,4096,0.013456000222100152
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,512,3072,0.006240889016124938
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,512,65536,0.017483555608325534
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,512,2560,0.006303999986913469
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,512,3584,0.013439999686347114
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,512,2048,0.005931555396980709
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,512,3072,0.013351110948456658
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,512,1536,0.0042453333735466
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,512,2560,0.012811555630630918
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,512,1024,0.003863999827040566
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,512,2048,0.012084444363911947
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,512,768,0.003536000019974179
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,512,1536,0.012105777859687805
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,512,512,0.0031928889867332247
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,512,1024,0.011583999627166323
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,512,10240,0.008958222137557136
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,512,256,0.0031848889258172777
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,512,128,0.0028320000403457214
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,512,512,0.011721777419249216
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,768,1024,0.0041928887367248535
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,512,256,0.011459555890825061
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,512,32,0.0028311111446883944
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,512,64,0.011039999624093374
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,512,5120,0.007909333540333642
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,512,32,0.011190222369299995
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,256,51200,0.014838222000333997
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,256,65536,0.053207112683190234
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,256,16384,0.009352000223265754
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,256,51200,0.042768889003329806
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,256,12288,0.008349333372380998
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,256,16384,0.02128177715672387
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,256,10240,0.007599111232492659
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,256,12288,0.019222221440739103
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,256,8192,0.0069253332912921906
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,256,10240,0.017865777015686035
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,256,8192,0.01644088824590047
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,512,768,0.011406222151385413
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,256,6144,0.0069413334131240845
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,256,7168,0.015812445018026564
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,256,5120,0.006687110910813014
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,512,64,0.0028284444577164124
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,256,4096,0.00589155571328269
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,512,128,0.010482666393121084
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,256,3584,0.005879999862776862
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,256,6144,0.015127110812399121
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,256,3072,0.005930666708283954
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,256,5120,0.014670222997665405
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,256,2560,0.006281777802440856
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,256,65536,0.01718222267097897
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,256,3584,0.013761777844693927
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,256,2048,0.005294222384691238
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,256,3072,0.012999110751681857
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,256,1536,0.004540444248252445
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,256,1024,0.003846222327815162
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,256,2048,0.012440889245933957
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,256,768,0.00350577798154619
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,256,1024,0.011377777490350934
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,256,512,0.0032115555885765287
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,256,768,0.01204711116022534
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,256,256,0.002826666666401757
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,256,512,0.011427555647161273
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,256,128,0.0028826666788922418
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,256,256,0.01106844428512785
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,256,7168,0.006828444285525217
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,256,64,0.002518222149875429
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,256,32,0.002830222249031067
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,256,128,0.011034666664070554
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,128,65536,0.014821334017647637
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,256,64,0.011863110793961419
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,256,32,0.011013333168294696
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,128,51200,0.01276000009642707
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,128,16384,0.008064889245563084
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,128,65536,0.05050666795836555
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,128,12288,0.007672000262472365
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,128,51200,0.04177511069509718
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,128,16384,0.021280889709790547
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,256,4096,0.014124444789356656
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,128,8192,0.006928000185224745
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,128,12288,0.018467555443445843
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,128,7168,0.006295111030340195
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,256,2560,0.01344622257683012
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,128,10240,0.01787911189926995
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,128,6144,0.006321777900060018
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,128,5120,0.005936000082227919
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,256,1536,0.012058667010731168
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,128,7168,0.015471110741297403
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,128,4096,0.0058711109062035876
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,128,6144,0.01519466605451372
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,128,3584,0.005928888916969299
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,128,5120,0.014430221584108142
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,128,4096,0.013457777599493662
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,128,2560,0.005614222337802251
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,128,3584,0.013889777991506787
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,128,2048,0.005973333285914526
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,128,3072,0.013312000367376538
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,128,1536,0.004516444272465176
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,128,2560,0.012788444757461548
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,128,1024,0.004023111114899318
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,128,1536,0.012402666939629449
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,128,768,0.0035128887328836652
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,128,1024,0.011417778001891242
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,128,512,0.003170666595300039
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,128,768,0.012050666742854647
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,128,256,0.0028728888266616394
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,128,512,0.011415999796655444
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,128,10240,0.0069653333889113525
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,128,128,0.0025235555238193935
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,128,64,0.0025519999778932994
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,128,256,0.011387555963463254
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,128,32,0.002524444419476721
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,128,128,0.010684444672531553
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,128,64,0.011031111081441244
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,128,8192,0.016140444411171805
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,128,32,0.010696888797812991
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,64,51200,0.010596444209416708
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,64,16384,0.006991110742092133
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,64,12288,0.00674933319290479
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,64,65536,0.05032799972428215
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,64,10240,0.006222222414281633
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,128,3072,0.005698666804366642
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,64,51200,0.041476445065604314
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,64,16384,0.020947555700937908
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,64,8192,0.00627377794848548
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,64,7168,0.006249777972698212
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,64,12288,0.0185244447655148
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,64,6144,0.005543111099137201
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,64,10240,0.01722577710946401
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,64,5120,0.005559999909665849
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,64,8192,0.016170667277442086
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,64,4096,0.005208888815508948
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,64,7168,0.015452444553375244
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,64,3584,0.005603555589914322
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,64,6144,0.014839111102951897
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,64,3072,0.00526577772365676
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,64,5120,0.01443733274936676
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,64,2560,0.00592533333433999
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,64,4096,0.013873777455753751
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,64,2048,0.005224888937340842
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,64,3584,0.013454222016864352
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,64,1536,0.004239999999602635
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,64,3072,0.012917333179050021
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,64,1024,0.003846222327815162
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,64,2560,0.012814222110642327
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,64,768,0.0031679999083280563
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,64,2048,0.012728888955381183
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,64,1536,0.012086222569147745
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,64,512,0.003220444545149803
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,64,256,0.002961777771512667
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,64,1024,0.01142133358452055
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,64,768,0.012155555188655853
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,64,128,0.002491555487116178
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,64,64,0.002485333424475458
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,64,512,0.011407111254003314
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,64,32,0.00253866674999396
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,64,128,0.01073066641887029
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,64,65536,0.011366222467687396
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,32,65536,0.011075555450386472
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,32,51200,0.010123555858929953
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,64,32,0.010679110884666443
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,32,16384,0.006568888823191325
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,32,65536,0.05061777763896518
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,32,51200,0.04144533475240072
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,32,12288,0.007284444239404466
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,32,16384,0.02091377807988061
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,32,10240,0.0069155556460221606
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,32,8192,0.006569777925809224
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,32,12288,0.018254222141371835
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,32,10240,0.017197334104114108
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,32,7168,0.005964444329341252
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,32,6144,0.005550222264395819
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,32,8192,0.016160888804329764
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,32,5120,0.005902222047249476
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,128,2048,0.013032000097963544
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,32,4096,0.005497777627574072
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,32,7168,0.015454222758611044
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,32,6144,0.014783999986118741
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,32,3584,0.005583111196756363
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,32,5120,0.014463999205165438
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,32,4096,0.014157333307796054
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,32,3584,0.013634666800498962
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,32,3072,0.01312711089849472
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,32,2048,0.005583111196756363
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,32,2560,0.013064888616402945
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,64,256,0.011367999845080905
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,32,1536,0.004201777693298128
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,32,1024,0.0038204445607132385
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,32,2048,0.012720888687504662
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,64,64,0.010761777559916178
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,32,768,0.003510222252872255
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,32,512,0.0032088889016045462
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,32,1536,0.012492444780137805
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,32,256,0.0028737777223189673
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,32,1024,0.011371555427710215
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,32,768,0.011705777711338468
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,32,512,0.011707555916574268
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,32,64,0.002826666666401757
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,32,256,0.011363555159833698
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,32,32,0.0024782222592168385
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,32,128,0.01075466639465756
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,32,64,0.011400889191362592
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,13,32,32,0.011434666812419891
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,32,3072,0.0052693333062860705
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,32,2560,0.005941333456171884
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,65536,51200,0.4985653559366862
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,65536,16384,0.32342667049831814
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,65536,16384,0.17127733760409883
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,65536,51200,0.9686213599310981
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,13,32,128,0.0025759999536805684
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,65536,12288,0.2271724541982015
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,65536,12288,0.1300168832143148
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,65536,10240,0.1886577738655938
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,65536,8192,0.15515289041731092
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,65536,8192,0.12115555339389378
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,65536,7168,0.13372088803185359
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,65536,7168,0.10838666889402603
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,65536,10240,0.128912885983785
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,65536,6144,0.11536444558037652
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,65536,16384,0.19038844108581543
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,65536,10240,0.13754933410220677
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,65536,12288,0.1472862164179484
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,65536,8192,0.10912622345818414
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,65536,5120,0.09716711441675822
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,65536,4096,0.08161955409579806
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,65536,5120,0.0832586685816447
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,65536,7168,0.09836266438166301
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,65536,4096,0.06868710782792833
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,65536,3584,0.06190222501754761
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,65536,5120,0.07813777526219685
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,65536,6144,0.08870222171147664
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,65536,4096,0.06805600060356988
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,65536,3072,0.06015377574496799
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,65536,2560,0.050929778152041964
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,65536,3072,0.05807822280459934
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,65536,2560,0.0491484436723921
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,65536,3584,0.06247911188337538
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,65536,3072,0.05843200286229452
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,65536,2048,0.04225066635343763
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,65536,2560,0.052419556511773
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,65536,2048,0.04256622327698601
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,65536,6144,0.10638399918874104
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,65536,1024,0.02360800074206458
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,65536,2048,0.04742133286264208
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,65536,1024,0.023972445064120825
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,65536,3584,0.06923644410239325
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,65536,1536,0.034918222162458636
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,65536,1024,0.03504088852140639
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,65536,768,0.01862044466866387
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,65536,512,0.013564444250530668
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,65536,768,0.023286221755875483
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,65536,512,0.019355555375417072
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,65536,256,0.008347555167145198
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,65536,512,0.02943555514017741
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,65536,256,0.02621511121590932
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,65536,128,0.0069066666894488865
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,65536,128,0.014801777071423002
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,65536,1536,0.032815112007988825
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,65536,64,0.005910222315125995
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,65536,128,0.021645334031846788
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,65536,32,0.005894222193294101
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,65536,32,0.016151999433835346
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,65536,1536,0.04179199867778354
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,65536,768,0.03193777799606323
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,65536,51200,0.5253751013014052
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,65536,256,0.01579466627703773
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,51200,65536,0.5252879990471734
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,51200,51200,0.40062310960557723
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,51200,16384,0.2762755552927653
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,51200,65536,1.0872391594780815
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,51200,51200,0.8465982013278537
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,51200,16384,0.13938755459255642
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,65536,64,0.015124445160230001
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,51200,12288,0.20877688460879854
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,51200,10240,0.17411911487579346
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,51200,12288,0.10652533504698013
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,51200,8192,0.13998577329847547
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,51200,10240,0.1094213326772054
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,51200,8192,0.0964311096403334
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,51200,7168,0.12443199422624375
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,51200,12288,0.12339822451273601
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,51200,10240,0.10679466856850518
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,51200,16384,0.15671200222439235
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,51200,7168,0.08450488911734687
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,51200,6144,0.10490400261349148
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,51200,5120,0.08993066681755914
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,51200,8192,0.09330222341749404
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,51200,6144,0.07793511284722222
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,51200,4096,0.07297599977917142
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,51200,7168,0.08459999826219346
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,51200,5120,0.0701084468099806
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,51200,3584,0.06373155779308744
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,51200,4096,0.0569173362520006
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,51200,5120,0.06839288605584039
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,51200,3584,0.05186311072773404
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,51200,4096,0.059824890560574
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,51200,3584,0.05606844690110949
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,51200,3072,0.04516888989342583
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,51200,2560,0.04704622096485562
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,51200,2560,0.04219466778967115
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,51200,3072,0.05231822199291653
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,51200,2048,0.03806133402718438
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,51200,2560,0.047091556919945605
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,51200,1536,0.029931555191675823
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,51200,2048,0.033377776543299355
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,51200,2048,0.04388799932267931
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,51200,1024,0.02139288849300808
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,51200,1536,0.029892444610595703
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,51200,1536,0.04011111127005683
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,51200,6144,0.07570666737026639
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,51200,1024,0.02331200076474084
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,51200,768,0.015601777368121676
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,51200,1024,0.031297776434156634
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,51200,512,0.01110222190618515
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,51200,768,0.02997777859369914
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,51200,768,0.02019733356104957
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,51200,512,0.02891555428504944
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,51200,512,0.017418666018380057
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,51200,256,0.007594666547245449
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,51200,128,0.0041662222809261745
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,51200,256,0.014102222190962898
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,51200,64,0.00349866681628757
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,51200,128,0.012797333300113678
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,51200,32,0.0038542221817705366
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,51200,64,0.014103111293580798
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,51200,32,0.014635556273990206
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,51200,51200,0.4134959909651015
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,16384,65536,0.32019734382629395
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,16384,65536,0.182824002371894
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,16384,51200,0.24938133027818468
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,16384,51200,0.14204088846842447
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,51200,3072,0.055890666113959424
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,16384,16384,0.09114488628175522
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,51200,256,0.023696889479955036
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,51200,128,0.020516445239384968
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,16384,12288,0.07110222180684407
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,16384,12288,0.04480088750521342
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,16384,10240,0.05406844284799364
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,16384,16384,0.07039999961853027
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,16384,10240,0.047304888566335045
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,16384,12288,0.059843553437127
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,16384,8192,0.04456444581349691
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,16384,8192,0.04447911183039347
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,16384,7168,0.03829955392413669
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,16384,8192,0.04950755503442553
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,16384,10240,0.05325422353214688
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,51200,65536,0.5383626619974772
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,16384,6144,0.0336497790283627
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,16384,65536,0.19696444935268828
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,16384,7168,0.04831022355291578
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,16384,5120,0.02884888980123732
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,16384,6144,0.03702133231692844
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,16384,16384,0.05669244130452474
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,16384,6144,0.04343644446796841
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,16384,4096,0.024634665913052026
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,16384,5120,0.03268977668550279
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,16384,3584,0.021242666575643752
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,16384,4096,0.028816888729731243
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,16384,3584,0.02607911162906223
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,16384,3584,0.035306665632459856
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,16384,3072,0.024636444118287828
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,16384,3072,0.03310844302177429
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,16384,2560,0.015915556086434256
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,16384,2560,0.03184177809291416
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,16384,2560,0.022300443715519373
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,16384,2048,0.013046222428480784
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,16384,2048,0.019487111104859244
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,16384,7168,0.03986488779385885
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,16384,1536,0.018178666631380718
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,16384,51200,0.1561111079321967
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,16384,1536,0.029297779003779095
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,16384,1024,0.00828888929552502
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,16384,5120,0.040468444426854454
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,16384,768,0.0069191112286514705
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,16384,3072,0.018587556150224473
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,16384,1024,0.02533600065443251
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,16384,512,0.004920888692140579
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,16384,768,0.02379200028048621
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,16384,512,0.01274222218328052
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,16384,512,0.022870222727457683
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,16384,256,0.0033253334048721525
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,16384,256,0.021334222621387903
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,16384,128,0.0031759999692440033
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,16384,256,0.012056888805495368
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,16384,2048,0.02956355611483256
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,16384,128,0.011718221836619906
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,16384,64,0.011704888608720569
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,16384,32,0.0028417776856157514
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,16384,32,0.011369778050316704
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,16384,1024,0.015695111619101632
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,16384,768,0.014096889230940076
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,12288,65536,0.25193601184421116
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,12288,65536,0.1571226649814182
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,12288,51200,0.19818666246202257
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,12288,51200,0.12258044878641765
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,12288,16384,0.06746933195326063
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,16384,64,0.002862222285734283
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,12288,16384,0.05030311147371928
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,12288,12288,0.05240355597601997
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,12288,16384,0.061349332332611084
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,12288,12288,0.04031199879116482
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,16384,4096,0.03554933269818624
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,12288,10240,0.05006222261322869
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,12288,12288,0.051338666015201144
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,12288,65536,0.15585245026482478
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,12288,51200,0.1248026688893636
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,12288,10240,0.04686222142643399
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,12288,8192,0.039677331844965615
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,12288,7168,0.03289244572321574
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,16384,128,0.020998222960366145
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,12288,6144,0.02895911203490363
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,12288,8192,0.04408266809251574
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,12288,7168,0.03593511051601834
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,12288,7168,0.0404079986943139
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,12288,5120,0.025389333566029865
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,12288,6144,0.03145155641767714
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,12288,4096,0.020082667469978333
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,12288,6144,0.03882666760020786
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,12288,5120,0.02864355511135525
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,12288,5120,0.03658755620320638
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,12288,3584,0.017477333545684814
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,12288,4096,0.026424888107511733
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,12288,4096,0.03344088792800903
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,12288,10240,0.044687112172444664
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,12288,3072,0.015473778049151102
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,12288,3584,0.03293155630429586
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,12288,2560,0.013109332985348172
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,12288,3584,0.024403555525673762
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,12288,3072,0.02187555531660716
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,12288,2048,0.011741333537631564
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,12288,2560,0.020850666695170935
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,12288,2560,0.030319998661677044
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,12288,1536,0.009671111073758867
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,12288,2048,0.02864977717399597
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,12288,8192,0.03735555542839898
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,12288,1024,0.007648888561460707
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,12288,1536,0.017350221673647564
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,12288,1536,0.0273333340883255
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,12288,768,0.006559999866618051
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,12288,1024,0.025065778030289546
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,12288,1024,0.013426666458447775
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,12288,512,0.004530666602982415
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,12288,768,0.02330488959948222
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,16384,1536,0.010674667027261523
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,12288,512,0.021715554926130507
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,12288,256,0.011973333027627734
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,12288,512,0.01273155543539259
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,12288,128,0.0032186667538351486
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,12288,256,0.022655111220147874
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,12288,128,0.011427555647161273
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,12288,128,0.021299555897712708
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,12288,64,0.0031893334041039148
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,12288,32,0.0031742221779293488
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,12288,64,0.01241422196229299
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,12288,3072,0.03200088938077291
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,12288,32,0.010919111470381418
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,12288,2048,0.019001776973406475
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,10240,65536,0.21646666526794434
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,10240,65536,0.14949156178368464
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,10240,51200,0.17273688316345215
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,12288,768,0.013436444103717804
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,10240,16384,0.059177776177724205
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,10240,51200,0.11795022752549912
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,10240,12288,0.04658133453792996
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,10240,16384,0.04758933186531067
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,10240,12288,0.03910577628347609
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,10240,10240,0.03850933247142368
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,10240,16384,0.05539555682076348
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,10240,12288,0.047545777426825635
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,10240,8192,0.032229334115982056
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,10240,10240,0.04066133168008592
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,10240,7168,0.029285334878497656
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,10240,10240,0.04500088757938809
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,10240,51200,0.11284000343746609
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,10240,8192,0.032976888948016696
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,10240,65536,0.14174666669633654
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,10240,6144,0.026180444492234126
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,10240,8192,0.04159911142455207
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,10240,5120,0.022357333037588332
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,10240,7168,0.03095910946528117
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,10240,7168,0.03930400146378411
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,10240,5120,0.025051555699772302
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,10240,6144,0.03686133358213637
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,10240,5120,0.03531377845340305
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,10240,3584,0.015971556305885315
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,10240,4096,0.022448889083332483
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,10240,4096,0.03273777829276191
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,10240,3072,0.01442488862408532
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,12288,256,0.00351555562681622
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,10240,3584,0.03185333477126227
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,10240,3584,0.02106133268939124
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,10240,2560,0.012482666307025485
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,10240,2048,0.01107377807299296
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,10240,3072,0.030975110001034204
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,10240,3072,0.019903999235894945
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,10240,2560,0.030252443419562444
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,10240,2560,0.019225777851210702
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,10240,1536,0.008955555657545725
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,10240,2048,0.027598222096761067
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,10240,1024,0.007594666547245449
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,10240,2048,0.017516444126764934
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,10240,1536,0.016171556380059984
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,10240,1536,0.027076444692081873
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,10240,768,0.0059004442559348206
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,10240,1024,0.013094222380055321
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,10240,512,0.004586666822433472
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,10240,1024,0.021917333205540974
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,10240,256,0.003850666599141227
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,10240,768,0.022330666581789654
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,10240,768,0.013409777647919126
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,10240,128,0.0031591111587153543
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,10240,512,0.022640888889630634
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,10240,512,0.012378666963842181
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,10240,64,0.0031644445326593188
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,10240,256,0.021264889174037512
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,10240,256,0.011382222175598145
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,10240,32,0.003177777760558658
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,10240,128,0.020634666085243225
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,10240,128,0.011687999798191918
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,10240,64,0.011404444773991903
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,10240,32,0.010739555789364709
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,10240,6144,0.027913779020309448
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,8192,65536,0.17500178019205728
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,8192,65536,0.10191822052001953
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,8192,51200,0.13064800368414983
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,8192,16384,0.045372443066702954
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,8192,51200,0.07962044742372301
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,8192,12288,0.03291911217901442
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,8192,16384,0.036419557200537786
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,8192,10240,0.02773422168360816
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,8192,12288,0.029915554655922785
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,8192,16384,0.05229422118928698
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,8192,8192,0.025039111574490864
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,8192,12288,0.04570666617817349
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,8192,10240,0.03268622358640035
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,8192,10240,0.043997334109412305
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,8192,7168,0.021858667333920796
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,8192,8192,0.02677333354949951
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,8192,6144,0.018978666928079393
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,8192,8192,0.039876444472206965
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,8192,51200,0.10628177722295125
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,8192,7168,0.024442666106753882
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,8192,65536,0.1293555498123169
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,8192,5120,0.016581333345837064
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,8192,7168,0.03872977693875631
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,8192,6144,0.02299733294381036
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,8192,6144,0.0358862214618259
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,8192,4096,0.01384800010257297
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,8192,3584,0.01241422196229299
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,8192,5120,0.020929776959949072
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,8192,4096,0.03183822168244256
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,8192,4096,0.019532443748580087
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,8192,3072,0.011390222443474663
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,8192,3584,0.031030221117867365
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,8192,3584,0.018420444594489205
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,8192,2560,0.009927999642160203
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,8192,3072,0.017507554756270517
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,8192,2048,0.008489777644475302
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,8192,2560,0.01699822147687276
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,8192,2048,0.015698666373888653
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,8192,2048,0.028190222051408555
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,8192,1536,0.007293333609898885
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,8192,1536,0.02488800055450863
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,8192,1536,0.014485332700941296
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,8192,1024,0.00552977787123786
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,8192,1024,0.012799111505349478
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,8192,1024,0.021724444296624925
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,8192,768,0.004831111265553368
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,8192,768,0.01238666640387641
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,8192,768,0.021939555803934734
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,8192,512,0.0038515557017591265
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,8192,5120,0.0343413319852617
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,8192,256,0.0035031110876136353
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,8192,512,0.021002666817771062
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,8192,512,0.011891555454995898
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,8192,128,0.0028400001012616684
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,10240,4096,0.018564444449212816
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,8192,256,0.020580444071027968
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,8192,256,0.011768889096048145
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,8192,64,0.0028159999185138275
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,8192,128,0.01072622256146537
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,8192,128,0.020961778031455144
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,8192,2560,0.02865511178970337
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,8192,64,0.012057777908113269
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,8192,32,0.011037333144081963
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,7168,65536,0.14883200327555338
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,7168,65536,0.09502400292290582
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,7168,51200,0.11722489198048909
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,7168,16384,0.0418817765182919
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,7168,51200,0.07313333617316352
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,7168,16384,0.03395466672049628
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,7168,12288,0.03353155652681986
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,7168,16384,0.05256444546911451
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,7168,12288,0.02813777658674452
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,7168,10240,0.028139554791980322
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,7168,65536,0.12830844190385607
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,7168,12288,0.04608444372812907
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,7168,51200,0.10623644457923041
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,7168,8192,0.02180888917711046
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,7168,10240,0.031215111414591473
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,8192,3072,0.03031733300950792
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,7168,10240,0.0432604451974233
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,7168,7168,0.020392000675201416
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,7168,8192,0.02604266670015123
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,7168,6144,0.018016889691352844
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,7168,8192,0.0403404434521993
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,7168,5120,0.015472888946533203
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,7168,7168,0.02435644467671712
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,7168,7168,0.03798666596412659
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,7168,6144,0.022127999199761286
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,7168,5120,0.02128622266981337
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,7168,5120,0.03393955694304572
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,7168,3584,0.011791110866599612
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,7168,4096,0.019070222973823547
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,7168,4096,0.032904889848497175
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,7168,3072,0.010871111518806882
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,7168,3584,0.0188080006175571
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,7168,3072,0.01789066692193349
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,7168,3072,0.03013777732849121
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,7168,2560,0.009708444277445475
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,7168,2560,0.016880000631014507
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,7168,2560,0.029145777225494385
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,7168,2048,0.008007999923494127
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,7168,2048,0.0148044443792767
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,7168,2048,0.02693866689999898
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,7168,1536,0.007255111303594377
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,7168,1024,0.005592888842026393
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,8192,32,0.0028284444577164124
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,7168,1536,0.024453333682484094
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,7168,1536,0.014160888062583076
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,7168,768,0.004181333300140169
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,7168,1024,0.021929777330822412
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,7168,1024,0.012387555506494312
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,7168,512,0.003825777934657203
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,7168,6144,0.035360889302359685
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,7168,768,0.02199911077817281
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,7168,768,0.012816000315878125
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,7168,256,0.0032088889016045462
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,7168,512,0.020901333954599168
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,7168,128,0.0031600000543726813
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,7168,256,0.02254844374126858
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,7168,256,0.011057777537239922
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,7168,64,0.0028488888508743713
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,7168,128,0.020283554991086323
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,7168,128,0.011344888971911537
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,7168,32,0.0028648889727062653
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,7168,3584,0.030974222554100886
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,7168,64,0.010752889017264048
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,7168,32,0.010743111371994019
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,6144,65536,0.12324799431694879
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,6144,65536,0.08655377891328599
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,6144,51200,0.0670800010363261
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,6144,16384,0.035880890157487653
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,6144,16384,0.03219111098183526
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,6144,65536,0.12850844860076904
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,6144,16384,0.052582220898734204
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,7168,4096,0.013099555340078143
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,6144,51200,0.10595111052195232
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,6144,12288,0.028480887413024902
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,6144,10240,0.024911999702453613
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,6144,12288,0.025968889395395916
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,6144,12288,0.04623644550641378
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,6144,8192,0.021511110994550917
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,6144,10240,0.04241866535610623
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,6144,7168,0.019419555862744648
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,6144,8192,0.025085333320829604
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,6144,8192,0.0398613346947564
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,6144,6144,0.017130666308932833
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,6144,51200,0.09722310966915554
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,6144,7168,0.022681777675946552
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,6144,7168,0.03707289033465915
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,6144,5120,0.015328889091809591
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,6144,6144,0.022653333014912073
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,6144,4096,0.01184800018866857
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,6144,6144,0.03523111012246873
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,6144,5120,0.03390222125583225
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,6144,5120,0.020301333732075162
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,6144,3584,0.010088000032636855
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,6144,4096,0.01889244384235806
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,6144,3072,0.010020444790522257
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,6144,3584,0.017941332525677152
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,6144,3584,0.03050666716363695
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,6144,2560,0.00923999978436364
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,6144,3072,0.030504888958401147
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,6144,3072,0.01770666738351186
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,6144,2048,0.00792622235086229
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,6144,2560,0.01609777741962009
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,7168,512,0.012063999970753988
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,6144,2560,0.02978844443957011
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,6144,1536,0.0069066666894488865
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,6144,2048,0.024837333295080397
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,6144,2048,0.014484445254007975
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,6144,1024,0.005097777893145879
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,6144,10240,0.02814399864938524
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,6144,1536,0.013451555536852943
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,6144,768,0.004181333300140169
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,6144,1536,0.024285333024130926
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,6144,512,0.0034933334423436057
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,6144,1024,0.012758221891191272
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,6144,1024,0.021962665849261816
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,6144,256,0.003181333343187968
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,6144,768,0.02200711104604933
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,6144,768,0.012438221938080259
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,6144,128,0.002854222224818336
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,6144,512,0.022307554880777996
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,6144,512,0.011887999872366587
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,6144,64,0.0025351111673646504
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,6144,256,0.01108266661564509
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,6144,32,0.0028293333533737394
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,6144,128,0.020652444826232064
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,6144,128,0.011415111521879831
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,6144,64,0.011702222128709158
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,5120,65536,0.10785066419177586
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,5120,65536,0.07827911112043592
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,6144,4096,0.03145066565937466
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,5120,51200,0.08544800016615127
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,5120,16384,0.03215466605292426
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,5120,51200,0.06129066811667549
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,5120,16384,0.03010222315788269
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,5120,12288,0.026008889079093933
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,5120,16384,0.05259999963972303
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,5120,65536,0.12729867299397787
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,5120,12288,0.0236826671494378
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,5120,51200,0.10544000069300334
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,5120,10240,0.022310222188631695
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,5120,8192,0.01943555474281311
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,5120,12288,0.046000000503328115
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,5120,10240,0.028761777612898085
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,5120,10240,0.041173332267337374
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,5120,7168,0.01755466726091173
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,5120,8192,0.03875644339455499
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,5120,8192,0.023953777220514085
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,6144,256,0.020759110649426777
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,5120,6144,0.0155102229780621
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,5120,5120,0.014369777507252164
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,5120,7168,0.03643555442492167
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,5120,7168,0.022594667143291895
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,5120,4096,0.011576889289749993
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,5120,6144,0.03548355566130744
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,5120,6144,0.021644444929228887
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,5120,3584,0.01014755583471722
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,5120,5120,0.01961511042382982
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,6144,32,0.010085333552625444
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,5120,3072,0.009347555538018545
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,5120,4096,0.03155733479393853
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,5120,4096,0.017856000198258292
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,5120,2560,0.00847999999920527
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,5120,3584,0.01752444439464145
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,5120,3072,0.016551110479566786
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,5120,3072,0.030185778935750324
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,5120,2048,0.007304888632562425
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,5120,2560,0.028933333026038274
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,5120,2560,0.015116444892353482
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,5120,1536,0.005903111149867375
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,5120,2048,0.014130666851997375
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,5120,2048,0.024696000748210486
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,5120,1024,0.004794666750563515
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,5120,1536,0.01314222233162986
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,5120,1536,0.024353777368863423
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,5120,768,0.0041955556306574075
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,5120,1024,0.0123848890264829
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,5120,512,0.0038408889538711975
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,5120,768,0.021944888763957556
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,5120,512,0.011409777734014722
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,5120,512,0.02130577796035343
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,5120,256,0.003175111073586676
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,5120,256,0.020637333393096924
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,5120,256,0.011062222222487131
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,5120,128,0.002990222225586573
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,5120,64,0.00282222218811512
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,5120,128,0.0192239996459749
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,5120,128,0.01069155583779017
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,5120,32,0.0028151110228565005
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,5120,5120,0.03351733419630263
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,5120,64,0.011056889262464313
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,4096,65536,0.08586400085025364
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,5120,3584,0.030644443300035264
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,5120,32,0.010047111246320937
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,4096,65536,0.07153333557976617
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,4096,16384,0.02784622377819485
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,4096,51200,0.05726399686601427
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,4096,16384,0.0258240004380544
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,5120,1024,0.023037332627508376
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,4096,16384,0.05192800031767952
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,4096,12288,0.0218231115076277
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,4096,51200,0.10551289055082534
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,4096,10240,0.01908622185389201
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,5120,768,0.012631110846996307
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,4096,65536,0.12770133548312718
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,4096,8192,0.016926222377353244
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,4096,12288,0.02306933369901445
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,4096,10240,0.025233777032958135
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,4096,7168,0.013733333183659447
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,4096,10240,0.04201066825124952
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,4096,8192,0.022542221678627863
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,4096,8192,0.03947110970815023
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,4096,6144,0.012350222302807702
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,4096,5120,0.010846222440401712
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,4096,7168,0.03700622253947788
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,4096,7168,0.021029333273569744
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,4096,6144,0.035227557023366295
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,4096,6144,0.019855999284320407
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,4096,4096,0.010441777606805166
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,4096,3584,0.00870311094654931
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,4096,5120,0.018906666172875296
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,4096,5120,0.03342311249838935
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,4096,4096,0.031390223238203264
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,4096,3072,0.007967111137178209
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,4096,4096,0.017854221993022494
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,4096,2560,0.007369777394665613
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,4096,3584,0.015810666812790763
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,4096,3072,0.02803022331661648
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,4096,3072,0.015379556351237826
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,4096,2048,0.006221333311663733
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,4096,51200,0.06787377595901489
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,4096,2560,0.027061333258946735
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,4096,1536,0.00488711107108328
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,4096,2048,0.02608088817861345
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,4096,2048,0.013755555782053204
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,4096,1024,0.0038364442686239877
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,4096,1536,0.013066666821638743
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,4096,1536,0.02404266595840454
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,4096,768,0.003560888684458203
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,4096,1024,0.023303111394246418
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,4096,1024,0.012048000262843238
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,4096,512,0.003499555504984326
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,4096,768,0.02199199961291419
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,4096,768,0.012049777640236748
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,4096,256,0.003137777869900068
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,4096,512,0.011423110961914062
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,4096,512,0.022625777456495497
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,4096,12288,0.04439022143681844
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,4096,256,0.02030044462945726
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,4096,256,0.011028444601429833
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,4096,64,0.0028355556229750314
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,4096,32,0.0028657778683635923
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,4096,128,0.019955555597941082
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,4096,64,0.01109866632355584
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,3584,65536,0.07789688640170626
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,4096,32,0.010040000081062317
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,3584,51200,0.06054221921496921
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,3584,65536,0.06889155838224623
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,4096,3584,0.030180444320042927
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,3584,16384,0.023345778385798138
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,3584,51200,0.05523555477460226
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,4096,2560,0.014793778459231058
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,3584,16384,0.0255377772781584
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,3584,65536,0.12774488661024305
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,3584,12288,0.019144889381196763
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,3584,16384,0.05128711130883959
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,3584,51200,0.10538311137093438
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,3584,10240,0.01684888866212633
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,3584,12288,0.04385688900947571
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,3584,12288,0.02193244463867611
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,3584,8192,0.014522666732470194
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,3584,10240,0.04233244392606947
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,3584,7168,0.013644444445768992
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,4096,128,0.002862222285734283
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,3584,8192,0.023641778363121882
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,3584,6144,0.011959999799728394
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,4096,128,0.011408888631396823
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,3584,7168,0.03678933448261685
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,3584,5120,0.010354667074150508
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,3584,6144,0.019780443774329293
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,3584,6144,0.035749332772360906
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,3584,4096,0.009343999955389235
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,3584,5120,0.017885333961910672
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,3584,5120,0.03424088822470771
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,3584,3584,0.008561777571837107
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,3584,4096,0.031075557072957356
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,3584,4096,0.01661688917213016
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,3584,3072,0.007909333540333642
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,3584,3584,0.015804444750150044
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,3584,3584,0.028861333926518757
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,3584,2560,0.0069439998931354946
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,3584,3072,0.014491554763582019
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,3584,3072,0.02808622188038296
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,3584,2048,0.005780444376998478
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,3584,2560,0.014071111877759298
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,3584,2560,0.027455111344655354
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,3584,1536,0.004862222406599256
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,3584,2048,0.013752889302041797
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,3584,10240,0.02568977740075853
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,3584,1536,0.013067555924256643
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,3584,1024,0.003863999827040566
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,3584,1536,0.024336889386177063
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,3584,768,0.0035013332962989807
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,3584,8192,0.03808800048298306
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,3584,1024,0.02200711104604933
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,3584,1024,0.012424888710180918
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,3584,512,0.003383111208677292
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,3584,7168,0.021401777863502502
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,3584,768,0.021968000464969214
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,3584,768,0.012520000338554382
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,3584,512,0.021606221795082092
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,3584,512,0.011863110793961419
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,3584,128,0.002817777709828483
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,3584,256,0.02165688905451033
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,3584,256,0.010864888628323873
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,3584,64,0.002846222163902389
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,3584,32,0.0028311111446883944
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,3584,128,0.011376889215575324
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,3584,128,0.01995644470055898
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,3584,64,0.010678222609890832
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,3072,65536,0.06365955538219877
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,3584,32,0.010407110883129967
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,3072,51200,0.05106666684150696
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,3072,65536,0.06557155317730375
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,3072,16384,0.020720889170964558
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,3072,51200,0.053878221246931285
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,3072,16384,0.0247999992635515
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,3072,12288,0.017265778448846605
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,3072,16384,0.05156177613470289
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,3584,2048,0.024139554964171514
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,3072,51200,0.10594044129053752
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,3072,10240,0.01682577696111467
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,3072,12288,0.02126577827665541
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,3072,10240,0.023363555471102398
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,3072,8192,0.015118221441904703
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,3584,256,0.0031795555518733132
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,3072,8192,0.037351999017927386
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,3072,8192,0.020124443703227572
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,3072,7168,0.01238666640387641
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,3072,6144,0.011346666349305047
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,3072,7168,0.03676355547375149
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,3072,5120,0.010247999595271217
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,3072,6144,0.01861422260602315
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,3072,6144,0.03558133376969232
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,3072,4096,0.009351111120647853
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,3072,5120,0.017328888177871704
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,3072,4096,0.015459555718633862
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,3072,4096,0.029695110188590154
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,3072,3584,0.008163555628723567
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,3072,3584,0.030497776137457952
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,3072,3584,0.014499555031458536
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,3072,3072,0.007463110817803278
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,3072,65536,0.12739822599622938
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,3072,2560,0.006583111153708563
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,3072,3072,0.014117333624098035
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,3072,3072,0.028468443287743464
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,3072,12288,0.04407644602987501
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,3072,2048,0.005607111172543631
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,3072,10240,0.04142133394877116
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,3072,2560,0.014097778333557976
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,3072,1536,0.004563555535342959
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,3072,2560,0.026149332523345947
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,3072,2048,0.025681777132882014
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,3072,2048,0.013408000270525614
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,3072,1024,0.003882666842805015
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,3072,1536,0.024041778511471216
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,3072,768,0.0038515557017591265
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,3072,1024,0.023009777069091797
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,3072,1024,0.0123831108212471
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,3072,7168,0.019698666201697457
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,3072,512,0.003167111012670729
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,3072,768,0.011718221836619906
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,3072,256,0.0031582222630580268
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,3072,512,0.021937777598698933
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,3072,512,0.011352889239788055
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,3072,128,0.002838222309947014
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,3072,5120,0.03423644436730279
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,3072,256,0.021780444516075984
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,3072,256,0.010681777364677854
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,3072,64,0.002485333424475458
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,3072,128,0.02038666605949402
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,3072,128,0.010632889138327705
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,3072,64,0.011417778001891242
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,2560,65536,0.05755644374423557
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,3072,32,0.01073333372672399
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,2560,51200,0.0449795557392968
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,2560,65536,0.06401155392328899
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,2560,51200,0.05198666784498426
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,2560,16384,0.018939556346999276
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,2560,65536,0.12731999821133083
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,2560,51200,0.10530222124523586
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,3072,1536,0.012440889245933957
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,2560,16384,0.024315555890401203
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,2560,16384,0.05044088761011759
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,2560,10240,0.014334221680959066
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,2560,12288,0.020915556285116408
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,2560,12288,0.04443822304407755
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,3072,768,0.0226239992512597
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,2560,8192,0.01256977766752243
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,2560,10240,0.022965333527988855
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,2560,10240,0.04158133268356323
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,2560,7168,0.011904000408119626
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,2560,8192,0.01954844428433312
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,2560,6144,0.010779555473062726
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,2560,7168,0.035806222094429865
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,3072,32,0.002817777709828483
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,2560,7168,0.0188719994492001
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,2560,5120,0.00999466660949919
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,2560,6144,0.017439999514155917
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,2560,6144,0.033533334732055664
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,2560,4096,0.008749333520730337
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,2560,5120,0.015846222639083862
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,2560,5120,0.03382222188843621
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,2560,3584,0.007989333735571967
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,2560,4096,0.029912001556820337
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,2560,4096,0.014474666780895658
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,2560,3072,0.007239999870459239
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,2560,3584,0.014145778285132514
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,2560,3584,0.0284204449918535
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,2560,2560,0.006270222365856171
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,2560,3072,0.027091556125217017
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,2560,3072,0.013418667018413544
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,2560,2048,0.0052595556610160405
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,2560,2560,0.026050666968027752
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,2560,1536,0.00452888881166776
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,2560,2048,0.025702221526039973
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,2560,12288,0.015544889701737298
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,2560,1024,0.0038515557017591265
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,2560,1536,0.012753778033786349
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,2560,1536,0.025059555967648823
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,2560,768,0.0035031110876136353
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,2560,1024,0.022634666826989915
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,2560,1024,0.011711111499203576
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,2560,512,0.003168888803985384
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,2560,768,0.0120328888297081
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,2560,8192,0.03881511092185974
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,2560,768,0.022859555151727464
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,2560,256,0.0031964443624019623
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,2560,512,0.011403555671374003
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,2560,512,0.022960889670583937
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,2560,128,0.0028035555862718155
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,2560,256,0.011360000405046674
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,2560,256,0.02197155521975623
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,2560,64,0.0027235555979940626
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,2560,32,0.002528888897763358
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,2560,128,0.020937777227825586
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,2560,64,0.011711999773979187
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,2048,65536,0.05163822240299649
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,2560,32,0.010453333457310995
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,2048,51200,0.03654311100641886
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,2048,65536,0.06190311246448093
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,2048,16384,0.016034666034910414
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,2560,2560,0.013764444324705334
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,2048,51200,0.050395554966396756
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,2048,65536,0.12668800354003906
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,2048,12288,0.014863999353514777
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,2560,2048,0.012735111018021902
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,2048,16384,0.02353422178162469
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,2048,51200,0.10620355606079102
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,2048,12288,0.04407466782463921
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,2048,8192,0.012081777883900536
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,2048,10240,0.021184888150956895
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,2048,10240,0.04204266601138645
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,2048,8192,0.03869422276814779
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,2048,8192,0.019136000010702345
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,2048,7168,0.011710222396585675
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,2048,7168,0.017151110702090792
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,2048,7168,0.03732266690995958
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,2048,6144,0.010323555933104621
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,2560,128,0.011405333048767514
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,2048,5120,0.009758222434255812
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,2048,6144,0.015997333659066092
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,2048,6144,0.03422310948371887
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,2048,4096,0.008090666598743862
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,2048,5120,0.01516888870133294
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,2048,5120,0.03221688999070062
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,2048,3584,0.007285333342022366
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,2048,4096,0.01442577772670322
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,2048,4096,0.029143999020258587
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,2048,3072,0.006543111056089401
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,2048,3584,0.014130666851997375
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,2048,3584,0.027433777848879497
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,2048,2560,0.005662222289376789
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,2048,16384,0.05017333229382833
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,2048,3072,0.013580444786283704
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,2048,2048,0.005203555441564984
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,2048,3072,0.028113779094484117
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,2048,2560,0.025419554776615564
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,2048,2560,0.01313244468635983
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,2048,1536,0.004516444272465176
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,2048,2048,0.025038222471872967
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,2048,2048,0.012728888955381183
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,2048,1024,0.003891555385457145
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,2048,1536,0.023778667052586872
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,2048,768,0.003516444315512975
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,2048,1024,0.01238044434123569
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,2048,768,0.011720000041855706
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,2048,512,0.0031795555518733132
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,2048,512,0.011363555159833698
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,2048,512,0.020968889196713764
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,2048,256,0.0031102223114834893
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,2048,256,0.01074577785200543
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,2048,10240,0.01311466677321328
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,2048,128,0.002653333254986339
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,2048,12288,0.020555555820465088
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,2048,256,0.020741333564122517
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,2048,64,0.0028311111446883944
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,2048,128,0.010679999987284342
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,2048,128,0.020579554968410067
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,2048,32,0.002529777793420686
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,2048,1536,0.01240711079703437
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,2048,64,0.010676444404655032
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,2048,32,0.010746666954623329
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,2048,1024,0.023039110832744177
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,1536,51200,0.029267556137508813
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,1536,65536,0.059584889147016734
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,2048,768,0.022652443912294176
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,1536,16384,0.01386755539311303
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,1536,51200,0.049104889233907066
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,1536,65536,0.1273039976755778
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,1536,12288,0.013109332985348172
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,1536,16384,0.023581332630581323
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,1536,51200,0.10479378037982517
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,1536,16384,0.049913777245415576
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,1536,10240,0.011685333318180509
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,1536,8192,0.010326222413116032
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,1536,12288,0.020396444532606337
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,1536,10240,0.041287110911475286
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,1536,10240,0.01984177695380317
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,1536,7168,0.009600888523790572
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,1536,8192,0.01687111126052009
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,1536,8192,0.03645777702331543
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,1536,6144,0.009586667021115622
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,1536,7168,0.015815999772813585
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,1536,7168,0.03423110975159539
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,1536,5120,0.008650666309727563
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,1536,6144,0.015189333094490899
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,1536,6144,0.033596442805396184
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,1536,4096,0.007931555310885111
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,1536,5120,0.014779556128713818
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,1536,5120,0.03050133254792955
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,1536,3584,0.007251555720965068
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,1536,4096,0.01407911048995124
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,1536,3072,0.006789333290523953
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,1536,3584,0.013752000199423896
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,1536,65536,0.03662577933735318
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,1536,2560,0.00565244464410676
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,1536,3072,0.01347555551264021
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,1536,3072,0.02644355595111847
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,1536,2048,0.005199111170238919
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,1536,2560,0.012740444805887012
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,1536,2560,0.026716444227430556
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,1536,1536,0.004565333326657613
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,1536,2048,0.012728888955381183
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,1536,2048,0.024455999334653217
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,1536,1024,0.003842666745185852
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,1536,1536,0.012278222375445895
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,1536,1536,0.023737778266270954
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,1536,12288,0.044192890326182045
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,1536,1024,0.022330666581789654
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,1536,1024,0.01200355589389801
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,1536,512,0.003157333367400699
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,1536,768,0.022664889693260193
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,1536,768,0.011738667057620155
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,1536,256,0.0028417776856157514
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,1536,512,0.011367999845080905
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,1536,512,0.022321777211295232
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,1536,128,0.0028320000403457214
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,1536,256,0.010685332947307162
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,1536,256,0.020281778441535104
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,1536,64,0.002536000063021978
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,1536,128,0.020633776982625324
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,1536,4096,0.028676443629794653
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,1536,32,0.00281866660548581
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,1024,65536,0.025368889172871906
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,1536,64,0.011066666907734342
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,1536,3584,0.027239999837345544
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,1024,51200,0.02142222225666046
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,1536,32,0.010049777726332346
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,1024,65536,0.05716088745329115
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,1024,16384,0.01221333361334271
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,1024,65536,0.12668089071909586
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,1024,51200,0.046536889341142446
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,1024,51200,0.10538133647706772
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,1024,12288,0.011811555259757571
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,1024,16384,0.022291556000709534
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,1024,16384,0.05008088880115085
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,1024,10240,0.01032977799574534
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,1024,12288,0.01904088921017117
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,1536,768,0.0036684444381131064
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,1024,8192,0.009344889058007134
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,1024,10240,0.018185777796639335
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,1024,10240,0.039298666848076716
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,1024,7168,0.009701333112186855
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,1024,8192,0.03558933403756883
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,1024,8192,0.016526222229003906
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,1024,6144,0.008743999732865227
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,1024,7168,0.015806222955385845
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,1024,7168,0.0332275562816196
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,1024,5120,0.007992888490358988
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,1024,6144,0.015608888533380298
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,1024,4096,0.007814221911960179
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,1024,5120,0.014202665951516895
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,1536,128,0.011735111474990845
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,1024,3584,0.006959999601046245
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,1024,4096,0.014089778065681458
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,1024,4096,0.028146667612923518
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,1024,3072,0.006232000059551663
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,1024,3584,0.029125332832336426
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,1024,3584,0.013861333330472311
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,1024,2560,0.005608888963858287
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,1024,3072,0.013064000341627332
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,1024,3072,0.027116444375779893
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,1024,2048,0.006292444550328785
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,1024,2560,0.01311911145846049
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,1024,2560,0.025369778275489807
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,1024,1536,0.005616000129116907
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,1024,2048,0.0127368892232577
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,1024,2048,0.025349333882331848
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,1024,12288,0.04187822341918945
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,1024,1024,0.004559111264016894
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,1024,1536,0.011752888560295105
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,1024,768,0.003899555653333664
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,1024,1536,0.025046222739749487
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,1024,1024,0.011714666253990598
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,1024,1024,0.022664889693260193
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,1024,512,0.003616888903909259
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,1024,768,0.022687999738587275
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,1024,768,0.011538666983445486
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,1024,256,0.003154666680428717
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,1024,512,0.011743110915025076
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,1024,512,0.020255110330051847
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,1024,6144,0.03186310993300544
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,1024,256,0.02162844439347585
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,1024,256,0.011034666664070554
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,1024,64,0.0028115556471877625
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,1024,5120,0.030365334616767034
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,1024,32,0.002529777793420686
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,1024,128,0.01921066641807556
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,1024,128,0.011040888726711273
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,768,65536,0.023638221952650283
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,1024,64,0.011038222246699862
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,768,51200,0.019329778022236295
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,1024,32,0.010729778144094678
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,768,16384,0.010943999720944298
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,768,65536,0.05558844407399496
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,768,65536,0.1266124380959405
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,768,51200,0.04548622171084086
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,768,12288,0.011014222270912595
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,768,51200,0.1052488883336385
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,768,16384,0.021381333470344543
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,768,10240,0.009460444251696268
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,768,8192,0.008654221892356873
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,768,12288,0.018545778261290658
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,768,12288,0.04272888766394722
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,768,10240,0.017535110314687092
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,768,10240,0.039023998710844256
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,768,7168,0.009319110876984065
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,768,6144,0.008683555656009251
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,768,8192,0.01629066632853614
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,768,8192,0.034625778595606484
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,768,7168,0.015971556305885315
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,768,5120,0.00797155582242542
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,768,6144,0.03185866607560052
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,768,5120,0.014624888698259989
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,768,4096,0.007317333585686154
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,1024,128,0.0028497777465316984
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,768,4096,0.013993778162532382
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,768,3584,0.0069822221994400024
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,768,4096,0.029595557186338637
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,768,3584,0.013510222236315409
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,768,3072,0.006241777704821692
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,768,16384,0.04890577660666572
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,768,3072,0.013443555268976422
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,768,2560,0.005600000007285013
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,768,3072,0.026400888959566753
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,768,2560,0.013075555364290873
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,768,2048,0.005029333134492238
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,768,2560,0.02537422213289473
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,768,7168,0.03354488809903463
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,768,1536,0.004908444566859139
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,768,6144,0.015474667151769003
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,768,2048,0.012735111018021902
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,768,2048,0.024117334021462336
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,768,1024,0.004193777839342753
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,768,1536,0.02400711178779602
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,768,768,0.0038382220599386427
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,768,1024,0.011426666544543372
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,768,512,0.0034888887570963967
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,768,768,0.021353777911927965
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,768,512,0.011362666885058085
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,768,512,0.020233778489960563
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,768,256,0.0031555555760860443
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,768,3584,0.028459555572933618
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,768,128,0.0028684443483750024
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,768,256,0.010666666759385003
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,768,128,0.01891288823551602
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,768,128,0.011796444654464722
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,768,64,0.0028560000161329904
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,768,32,0.0024871110088295406
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,768,64,0.011383111278216044
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,768,32,0.010029333333174387
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,512,65536,0.018329777651362948
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,512,65536,0.05391200052367317
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,512,65536,0.12751021650102404
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,512,51200,0.016061334146393668
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,768,5120,0.030745777818891738
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,512,16384,0.010144000252087912
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,768,1024,0.023349333140585158
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,512,51200,0.04492888847986857
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,768,768,0.0120666664507654
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,512,12288,0.01036888857682546
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,512,16384,0.020908445119857788
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,512,16384,0.048604445325003735
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,512,10240,0.009311999711725447
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,512,12288,0.04180977741877238
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,512,12288,0.018887110882335238
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,512,8192,0.00831200016869439
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,512,10240,0.03901688920127021
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,512,10240,0.01755644381046295
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,512,7168,0.00905777762333552
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,768,256,0.020577778418858845
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,512,6144,0.008295111358165741
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,512,8192,0.03631733192337884
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,512,7168,0.034006221426857844
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,512,7168,0.015832889411184523
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,512,5120,0.00794400026400884
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,512,6144,0.03278933299912347
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,512,4096,0.007306666837798224
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,512,5120,0.014803555276658801
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,512,5120,0.030498666895760432
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,512,3584,0.006924444602595435
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,512,4096,0.014109333356221518
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,512,4096,0.029150221082899306
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,512,3072,0.006568888823191325
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,512,3584,0.013153778182135688
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,512,3584,0.02847111225128174
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,512,2560,0.006264888991912206
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,512,3072,0.013450666434235044
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,768,1536,0.01204533295498954
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,512,3072,0.027004443936877783
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,512,2048,0.005601777798599667
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,512,2560,0.01313066648112403
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,512,1536,0.004261333495378494
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,512,2048,0.012381333443853589
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,512,2048,0.024343111448817786
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,512,1024,0.0038559999730851916
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,512,1536,0.023432888918452795
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,512,1024,0.011077333655622272
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,512,768,0.003519111209445529
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,512,1024,0.021273778544531927
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,512,8192,0.016541333662139047
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,512,512,0.0032257777121331957
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,512,768,0.021613332960340712
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,512,6144,0.015139554937680563
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,512,256,0.0028284444577164124
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,512,512,0.011731555892361535
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,512,512,0.020597333709398907
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,512,128,0.0028124445428450904
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,512,256,0.021384000778198242
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,512,128,0.011060444845093621
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,512,128,0.020250666472646926
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,512,64,0.002502222235004107
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,512,64,0.011376889215575324
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,512,2560,0.026740445031060114
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,512,32,0.002528000002106031
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,512,51200,0.1038808888859219
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,256,65536,0.017664000391960144
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,512,32,0.01036800030204985
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,512,1536,0.012440889245933957
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,256,51200,0.01481244464715322
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,256,65536,0.0529333319928911
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,256,65536,0.12553332911597356
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,256,16384,0.009311999711725447
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,256,51200,0.04387111133999295
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,256,16384,0.021270222134060327
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,512,768,0.0110880004035102
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,256,12288,0.018765333626005385
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,256,12288,0.04140977727042304
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,256,10240,0.007592889169851939
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,512,256,0.010679110884666443
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,256,8192,0.006931555353932911
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,256,10240,0.03900622328122457
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,256,10240,0.01722311145729489
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,256,7168,0.006312888943486744
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,256,8192,0.035636444886525474
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,256,8192,0.016162667009565566
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,256,6144,0.006806222101052602
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,256,7168,0.015569777952300178
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,256,7168,0.034316443734698825
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,256,5120,0.006618666566080517
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,256,6144,0.015056888262430826
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,256,6144,0.0321777794096205
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,256,4096,0.005928888916969299
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,256,5120,0.01479200025399526
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,256,4096,0.013416888813177744
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,256,4096,0.029483556747436523
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,256,51200,0.10428000158733791
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,256,12288,0.008251555263996124
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,256,3072,0.006167999986145232
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,256,3584,0.02809777855873108
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,256,3584,0.01347644461525811
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,256,2560,0.006232888748248418
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,256,3072,0.013419555293189155
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,256,3072,0.027882665395736694
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,256,2048,0.005899555567238066
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,256,2560,0.012878222597969903
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,256,2560,0.02641777859793769
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,256,1536,0.004560889055331548
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,256,2048,0.012891555825869242
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,256,2048,0.025402666793929204
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,256,1024,0.0038951109680864546
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,256,1536,0.012521777715947894
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,256,1536,0.024353777368863423
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,256,768,0.0035128887328836652
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,256,1024,0.012167111039161682
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,256,1024,0.022827555735905964
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,256,512,0.003195555466744635
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,256,768,0.012078222301271228
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,256,768,0.022328888376553852
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,256,5120,0.03012977706061469
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,256,256,0.0028924445311228433
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,256,128,0.002536000063021978
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,256,512,0.011033777561452655
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,256,256,0.01143022212717268
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,256,256,0.020311999652120803
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,256,64,0.00281866660548581
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,256,128,0.019888000355826486
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,256,32,0.002512000087234709
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,256,16384,0.04719733198483785
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,128,65536,0.014846222268210517
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,256,64,0.010688888529936472
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,128,51200,0.01273155543539259
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,256,32,0.01108444482088089
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,128,65536,0.05004355642530653
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,128,65536,0.12442044417063396
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,128,16384,0.00776533368561003
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,128,51200,0.041504889726638794
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,128,51200,0.10276977883444892
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,128,12288,0.007605333295133378
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,128,16384,0.020634666085243225
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,128,16384,0.04752177662319607
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,128,10240,0.006908444480763541
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,128,12288,0.04074133435885111
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,128,8192,0.006635555376609166
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,128,10240,0.0173680004146364
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,128,10240,0.037689778539869524
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,128,7168,0.0062871111763848206
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,128,8192,0.016148444679048326
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,128,8192,0.03495555453830295
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,128,6144,0.006229333165619109
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,128,7168,0.015470221638679504
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,128,7168,0.03383466601371765
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,128,5120,0.005943111247486538
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,256,512,0.022259554929203455
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,128,6144,0.01498044364982181
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,128,6144,0.031839112440745033
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,128,4096,0.005585777676767773
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,256,3584,0.005554666535721884
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,128,3584,0.005570666657553778
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,128,5120,0.03152799937460158
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,128,5120,0.014430221584108142
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,128,4096,0.013400889105266996
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,128,4096,0.028429332706663344
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,128,3072,0.00591822216908137
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,128,3584,0.027360000544124182
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,128,3584,0.013399110900031196
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,128,2560,0.005888000130653381
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,128,3072,0.013073777986897362
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,128,3072,0.026038222842746313
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,128,2048,0.00526311124364535
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,128,2560,0.025241777300834656
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,128,1536,0.004541333350870344
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,128,2048,0.012111110819710625
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,128,2048,0.02398577829202016
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,128,1024,0.003882666842805015
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,128,12288,0.01864355636967553
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,128,1536,0.023370666636361018
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,128,768,0.003488000068399641
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,128,1024,0.011418666276666852
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,128,1024,0.022999111149046157
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,128,512,0.0031973332580592898
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,128,768,0.01107022249036365
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,128,512,0.011756444142924415
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,128,512,0.020920000142521326
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,128,256,0.002875555513633622
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,128,256,0.02165688905451033
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,128,256,0.010677333507272931
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,128,128,0.0025253333151340485
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,256,128,0.011738667057620155
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,128,64,0.002487999904486868
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,128,128,0.020107555720541213
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,128,128,0.01036088913679123
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,128,32,0.002510222295920054
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,64,65536,0.011525332927703857
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,128,64,0.011362666885058085
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,64,51200,0.01034400032626258
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,128,32,0.010328888893127441
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,64,16384,0.006948444578382704
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,128,2560,0.012423999607563019
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,64,65536,0.050272888607449
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,64,51200,0.041802667909198336
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,64,10240,0.006575999988449945
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,64,16384,0.020633776982625324
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,128,1536,0.011725333001878528
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,64,12288,0.0188719994492001
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,64,7168,0.006605333338181178
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,64,10240,0.017543110582563613
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,64,6144,0.005950222412745158
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,64,8192,0.015858666764365304
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,12,128,768,0.021317332983016968
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,64,5120,0.0052782222628593445
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,64,4096,0.005385777602593104
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,64,6144,0.01514311134815216
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,64,3584,0.0059057776298787855
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,64,5120,0.014441778262456259
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,64,4096,0.013752889302041797
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,64,3584,0.013761777844693927
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,64,2560,0.006242666807439592
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,64,3072,0.013063111239009433
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,64,2048,0.005599110904667113
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,64,2560,0.013085333009560903
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,64,1536,0.00424799985355801
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,64,2048,0.012401777837011548
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,64,1024,0.003571555432346132
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,64,1536,0.012445333103338877
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,64,768,0.003546666767862108
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,64,1024,0.011399110986126794
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,64,512,0.0031715554909573663
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,64,8192,0.006246222390068903
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,64,768,0.011946666571829053
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,64,256,0.0024968888610601425
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,64,128,0.0025235555238193935
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,64,512,0.011039999624093374
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,64,64,0.00254133323000537
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,64,256,0.01105955574247572
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,64,7168,0.015787555111779105
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,64,128,0.010374222364690568
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,64,32,0.002830222249031067
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,32,65536,0.011077333655622272
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,32,51200,0.010321777727868822
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,64,64,0.010399111443095738
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,32,16384,0.006952889263629913
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,64,32,0.011026666396194033
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,64,3072,0.0052533331844541765
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,32,65536,0.049660444259643555
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,32,16384,0.020767110917303298
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,32,8192,0.006144000010357962
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,32,12288,0.018631999691327412
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,32,7168,0.006278222219811545
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,32,8192,0.015857777661747403
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,32,6144,0.005608888963858287
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,32,7168,0.015792888071801927
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,32,5120,0.00555644432703654
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,32,6144,0.014835556348164877
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,32,4096,0.005566222386227713
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,64,12288,0.006820444431569841
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,32,5120,0.014448889427714877
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,32,3584,0.005622222191757626
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,32,3072,0.00554577757914861
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,32,4096,0.013773333695199756
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,32,3584,0.01348088930050532
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,32,2560,0.005923555543025334
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,32,3072,0.012788444757461548
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,32,2048,0.005227555417352253
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,32,2560,0.012892444100644855
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,32,1536,0.00423200014564726
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,32,2048,0.012401777837011548
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,32,1024,0.0035582222044467926
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,32,12288,0.006576889091067844
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,32,1536,0.012096000214417776
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,32,10240,0.006280888699822956
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,32,1024,0.011083555718262991
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,32,512,0.00314666661951277
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,32,256,0.0028648889727062653
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,32,768,0.011741333537631564
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,32,10240,0.016953777935769822
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,32,128,0.0025333333760499954
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,32,512,0.011027555498811932
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,32,64,0.002528888897763358
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,32,256,0.010341333018408881
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,32,128,0.010337777435779572
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,32,64,0.011075555450386472
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,32,32,0.009689778089523315
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,65536,16384,0.3235982259114583
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,65536,51200,0.4986746576097276
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,32,768,0.003666666646798452
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,65536,16384,0.1709360016716851
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,12,32,51200,0.04174222217665779
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,65536,12288,0.22677244080437553
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,65536,51200,0.9642284181382922
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,65536,10240,0.18859733475579155
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,65536,12288,0.13022843996683756
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,12,32,32,0.00281866660548581
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,65536,10240,0.12741511397891575
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,65536,6144,0.11530044343736436
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,65536,7168,0.1335457828309801
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,65536,7168,0.10019110971026951
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,65536,5120,0.09675911400053237
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,65536,6144,0.08894755442937215
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,65536,8192,0.11684355470869277
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,65536,4096,0.08122755421532525
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,65536,3584,0.0688026679886712
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,65536,3072,0.06022666560278999
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,65536,4096,0.06691910823186238
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,65536,5120,0.0825022194120619
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,65536,3584,0.05998488929536608
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,65536,2560,0.051113777690463595
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,65536,2048,0.04221066501405504
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,65536,1536,0.032681776417626276
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,65536,3072,0.053123556905322604
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,65536,2560,0.04867022236188253
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,65536,1024,0.023167999254332647
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,65536,768,0.018788443671332467
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,65536,512,0.013399110900031196
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,65536,1536,0.03194844391610887
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,65536,1024,0.02683288852373759
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,65536,256,0.008274666965007782
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,65536,128,0.006540444576077991
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,65536,768,0.02256800068749322
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,65536,512,0.01955200069480472
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,65536,64,0.005574222240183089
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,65536,32,0.0058871110280354815
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,65536,128,0.014099554883109199
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,65536,256,0.017126222451527912
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,65536,64,0.015250666273964776
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,65536,8192,0.15437066555023193
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,65536,32,0.01550044450494978
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,51200,16384,0.27831021944681805
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,51200,65536,0.5266737937927246
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,51200,51200,0.4008435673183865
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,51200,16384,0.1394959953096178
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,65536,2048,0.0420595539940728
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,51200,12288,0.20891200171576607
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,51200,10240,0.16910400655534533
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,51200,12288,0.1064373321003384
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,51200,8192,0.14055644141303167
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,51200,10240,0.12855999999576145
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,51200,65536,1.0927004284328885
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,51200,7168,0.12050844563378228
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,51200,6144,0.1061662236849467
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,51200,8192,0.11683911747402614
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,51200,7168,0.08137066496743096
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,51200,6144,0.07362844546635945
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,51200,3584,0.06437333424886067
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,51200,4096,0.05999822086758084
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,51200,3072,0.05572711096869575
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,51200,3584,0.05199822121196323
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,51200,5120,0.06830488973193698
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,51200,5120,0.08950310945510864
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,51200,2048,0.03745511174201965
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,51200,1536,0.029539555311203003
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,51200,2560,0.042711112234327525
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,51200,2048,0.036955555280049644
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,51200,1024,0.021947556071811255
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,51200,768,0.01610933409796821
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,51200,1536,0.028140445550282795
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,51200,1024,0.023378666904237535
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,51200,512,0.011347555451922946
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,51200,256,0.007299555672539606
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,51200,768,0.020230222079488967
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,51200,51200,0.8218293190002441
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,51200,512,0.017423111531469557
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,51200,128,0.0041831110914548235
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,51200,64,0.0035048888789282907
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,51200,128,0.013122667041089801
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,51200,32,0.003536000019974179
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,51200,256,0.01443822185198466
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,51200,64,0.014827556080288358
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,51200,4096,0.07299377520879109
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,51200,32,0.014362666341993542
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,51200,2560,0.04755022128423055
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,51200,3072,0.044490665197372437
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,16384,51200,0.14118044906192356
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,16384,65536,0.31893600357903373
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,16384,16384,0.09127999676598443
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,16384,12288,0.07095733616087171
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,16384,10240,0.05338399940066867
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,16384,12288,0.044998221927218966
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,16384,10240,0.05230489042070177
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,16384,8192,0.044793777995639376
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,16384,16384,0.056129780080583364
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,16384,7168,0.03882133298450046
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,16384,6144,0.033540444241629705
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,16384,5120,0.028691556718614366
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,16384,7168,0.03790666659673055
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,16384,4096,0.024005333582560223
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,16384,6144,0.0344106654326121
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,16384,5120,0.03535822365019057
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,16384,3584,0.021353777911927965
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,16384,3072,0.018744000130229525
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,16384,4096,0.027495111028353374
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,16384,3584,0.025685333543353613
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,16384,2560,0.015831111205948722
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,16384,3072,0.02289688918325636
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,16384,2048,0.012830221818553077
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,16384,1536,0.010672888822025724
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,16384,2560,0.022634666826989915
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,16384,1024,0.008285333712895712
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,16384,65536,0.18507022327846953
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,16384,51200,0.24944000773959688
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,16384,1536,0.01792977750301361
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,16384,512,0.005261333452330695
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,16384,1024,0.01610133383009169
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,16384,768,0.013776000175211163
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,16384,512,0.013767110804716745
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,16384,128,0.0028613333900769553
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,16384,256,0.012440889245933957
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,16384,64,0.0028773333049482773
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,16384,128,0.012231999801264869
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,16384,32,0.0028844444702068963
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,16384,8192,0.04292088747024536
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,16384,64,0.011767110890812345
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,16384,32,0.011784888803958893
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,12288,65536,0.2533564567565918
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,12288,65536,0.15756355391608343
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,12288,51200,0.1993244489034017
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,12288,16384,0.06714755296707153
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,12288,12288,0.05220444334877861
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,12288,16384,0.05018844538264804
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,16384,2048,0.019661333825853135
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,12288,51200,0.12230932712554932
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,12288,10240,0.04474222328927782
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,16384,768,0.00702133360836241
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,12288,8192,0.03757066528002421
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,12288,7168,0.03274310959710015
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,12288,6144,0.028804444604449805
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,12288,10240,0.043735110097461276
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,12288,5120,0.02555022140343984
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,16384,256,0.003277333246337043
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,12288,8192,0.03806844353675842
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,12288,7168,0.03762222329775492
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,12288,4096,0.020422221885787118
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,12288,3584,0.017490666773584154
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,12288,6144,0.030431999100579157
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,12288,3072,0.015494222442309061
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,12288,2560,0.013170666992664337
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,12288,5120,0.028964443339241877
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,12288,2048,0.011389333340856763
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,12288,3584,0.023959111836221483
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,12288,1536,0.009527111219035255
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,12288,3072,0.021244444780879553
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,12288,1024,0.007919111185603673
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,12288,768,0.00656088896923595
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,12288,2048,0.019293333093325298
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,12288,512,0.004537777768241035
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,12288,1536,0.0166320006052653
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,12288,1024,0.014133334159851074
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,12288,256,0.003539555602603488
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,12288,768,0.013436444103717804
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,12288,512,0.013463111387358772
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,12288,256,0.011743110915025076
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,12288,64,0.003181333343187968
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,12288,32,0.002858666703104973
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,12288,128,0.011386666860845355
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,12288,64,0.011717333561844297
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,12288,32,0.011756444142924415
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,10240,65536,0.21765955289204916
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,10240,51200,0.17171733909183076
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,10240,65536,0.15086577998267278
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,12288,12288,0.04008622301949395
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,10240,16384,0.05981155236562093
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,10240,51200,0.11723555458916558
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,10240,12288,0.04637777805328369
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,10240,16384,0.04779377910825941
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,10240,10240,0.038359112209743924
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,10240,8192,0.03244888782501221
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,12288,4096,0.02677333354949951
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,10240,12288,0.038690666357676186
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,10240,7168,0.028976887464523315
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,10240,10240,0.03878488805558946
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,12288,2560,0.021328889661365088
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,10240,6144,0.025975111458036635
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,10240,5120,0.022462222311231825
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,10240,8192,0.034041778908835515
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,10240,7168,0.028421332438786823
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,10240,4096,0.018869333797030978
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,10240,3584,0.0158924443854226
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,10240,6144,0.028088887532552082
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,10240,3072,0.01440533333354526
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,10240,5120,0.02639644510216183
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,10240,2560,0.012410666379663678
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,10240,4096,0.022823999325434368
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,10240,3584,0.022239999638663396
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,10240,2048,0.010766222245163388
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,10240,1536,0.008957333034939235
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,10240,3072,0.01961511042382982
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,10240,1024,0.007648000286685095
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,10240,2560,0.019367110398080613
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,10240,768,0.005894222193294101
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,10240,2048,0.01779111060831282
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,10240,512,0.004874666531880696
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,10240,1536,0.015450666348139444
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,10240,256,0.0035573335157500375
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,10240,1024,0.01314311143424776
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,10240,128,0.0031831111345026228
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,10240,768,0.01346577786737018
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,10240,64,0.0031724443866146933
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,10240,32,0.0028239999794297745
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,10240,256,0.011760888828171624
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,10240,128,0.011031111081441244
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,10240,64,0.012072888513406118
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,10240,32,0.011377777490350934
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,8192,65536,0.17374666531880698
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,8192,51200,0.1307928827073839
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,8192,16384,0.045500444041358105
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,8192,65536,0.10462044345008002
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,8192,12288,0.03305600086847941
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,8192,51200,0.07932000027762519
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,8192,10240,0.027572444743580286
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,8192,12288,0.030015110969543457
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,8192,16384,0.03626577721701728
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,8192,8192,0.025444444682863023
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,8192,10240,0.031714667876561485
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,8192,7168,0.021734222769737244
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,8192,6144,0.01903555625014835
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,8192,5120,0.016488000750541687
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,8192,8192,0.026556443836953905
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,8192,7168,0.02437422176202138
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,8192,6144,0.023375110493765935
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,8192,4096,0.01407911048995124
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,8192,3584,0.012576888832781049
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,8192,5120,0.021254221598307293
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,8192,3072,0.011516444385051727
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,8192,4096,0.019535111056433786
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,8192,2560,0.010043555663691627
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,8192,3584,0.019558222757445443
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,8192,2048,0.00830577810605367
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,8192,1536,0.007267555428875818
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,8192,3072,0.017628444565667045
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,8192,2560,0.01686755485004849
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,8192,1024,0.005897777775923411
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,10240,512,0.01310400002532535
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,8192,768,0.004537777768241035
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,8192,2048,0.015917332635985482
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,8192,1536,0.013753777576817406
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,8192,1024,0.012626666989591388
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,8192,768,0.012764444781674279
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,8192,512,0.01239111108912362
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,8192,128,0.0028577778074476454
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,8192,64,0.0028400001012616684
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,8192,256,0.011731555892361535
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,8192,32,0.0027991111079851785
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,8192,128,0.010746666954623329
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,8192,64,0.011737777955002256
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,8192,32,0.010384889112578498
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,7168,65536,0.14946756098005506
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,7168,51200,0.11756355232662624
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,7168,65536,0.09433777464760675
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,7168,16384,0.04193333453602261
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,12288,128,0.0032195556494924757
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,7168,51200,0.0726755526330736
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,7168,16384,0.03467999895413717
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,7168,10240,0.02823288904296027
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,7168,12288,0.02830044428507487
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,7168,8192,0.021922666165563796
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,7168,7168,0.02033333314789666
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,7168,10240,0.03015111221207513
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,7168,6144,0.018153778380817838
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,7168,7168,0.02329866588115692
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,8192,512,0.0038480001191298165
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,7168,5120,0.015799111790127225
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,8192,256,0.003162666741344664
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,7168,6144,0.02275644408331977
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,7168,4096,0.013748444616794586
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,7168,3584,0.01203555530971951
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,7168,5120,0.02092355489730835
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,7168,4096,0.019415999452273052
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,7168,3584,0.018720888429217868
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,7168,2560,0.009649777577983009
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,7168,2048,0.008399999803966945
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,7168,3072,0.017496888836224873
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,7168,1536,0.00721244431204266
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,7168,2560,0.016840888394249808
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,7168,1024,0.005159111072619756
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,7168,2048,0.015545777148670621
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,7168,768,0.0038702223036024305
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,7168,1536,0.013424889081054263
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,7168,512,0.0035342222286595237
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,7168,1024,0.012447111308574677
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,7168,256,0.0032088889016045462
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,7168,768,0.01276266657643848
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,7168,12288,0.032813333802753024
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,7168,128,0.0031715554909573663
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,7168,512,0.012085333466529846
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,7168,64,0.002842666581273079
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,7168,256,0.011709333293967776
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,7168,128,0.011064888702498542
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,7168,64,0.011492444409264458
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,7168,32,0.010363555616802638
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,7168,8192,0.026349332597520616
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,6144,65536,0.12262933784061009
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,6144,51200,0.09700622161229451
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,6144,16384,0.0358586675590939
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,6144,65536,0.0865466660923428
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,6144,12288,0.028757333755493164
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,6144,51200,0.0665902230474684
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,6144,10240,0.024492444263564214
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,6144,16384,0.03183111217286851
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,6144,8192,0.021789333886570398
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,6144,12288,0.025823111335436504
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,6144,7168,0.01924622224436866
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,6144,10240,0.027160889572567407
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,6144,6144,0.017148445049921673
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,6144,5120,0.01514400045077006
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,6144,7168,0.022630222969584998
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,6144,6144,0.021943999661339655
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,6144,4096,0.011738667057620155
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,6144,3584,0.010321777727868822
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,6144,4096,0.01887999971707662
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,6144,3072,0.010318222145239512
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,6144,3584,0.01888088881969452
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,6144,2560,0.008967999782827165
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,6144,3072,0.017027555240525138
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,6144,2048,0.007912889122962952
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,6144,2560,0.016502221425374348
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,6144,1536,0.0069573331210348345
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,6144,2048,0.014903111590279473
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,6144,1024,0.004855111241340637
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,6144,1536,0.013434666726324292
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,6144,768,0.0038942222793896994
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,7168,3072,0.01089866707722346
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,6144,1024,0.012379555238617791
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,6144,512,0.0035137778355015647
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,6144,768,0.0123857781291008
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,6144,256,0.003176888864901331
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,6144,128,0.0028328889360030494
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,6144,8192,0.024680000212457445
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,6144,512,0.012320000264379712
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,6144,64,0.0024782222592168385
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,6144,256,0.011381333072980246
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,6144,32,0.0028604444944196274
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,6144,128,0.011367110742463006
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,6144,5120,0.020258666740523446
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,6144,64,0.0120328888297081
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,5120,65536,0.10770666599273682
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,6144,32,0.010863111250930362
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,5120,51200,0.0854053364859687
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,5120,16384,0.0321777794096205
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,5120,12288,0.026113778352737427
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,5120,65536,0.07834488815731473
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,5120,51200,0.0611635579003228
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,5120,10240,0.022034666604465906
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,5120,16384,0.029521776570214167
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,5120,8192,0.019472888774342008
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,5120,12288,0.02358755634890662
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,7168,32,0.0028311111446883944
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,5120,7168,0.017335999343130324
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,5120,6144,0.015621332658661736
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,5120,5120,0.013960889644092984
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,5120,10240,0.02565777798493703
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,5120,8192,0.02405599918630388
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,5120,4096,0.011719110939237805
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,5120,7168,0.023696889479955036
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,5120,3072,0.009377777576446533
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,5120,5120,0.019887111253208585
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,5120,2560,0.008599110775523717
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,5120,3584,0.017699556218253244
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,5120,2048,0.007272000114123027
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,5120,3072,0.01570666664176517
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,5120,1536,0.005929777605666055
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,5120,2560,0.015160888433456421
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,5120,2048,0.014464888307783337
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,5120,1024,0.004590222405062782
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,5120,1536,0.013077333569526672
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,5120,768,0.0041804446114434134
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,5120,1024,0.013105777402718862
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,5120,512,0.003530666646030214
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,5120,768,0.012039999994966718
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,5120,256,0.0031591111587153543
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,5120,512,0.012431999875439538
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,5120,128,0.0028604444944196274
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,5120,256,0.011411555939250521
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,5120,64,0.0028124445428450904
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,5120,128,0.011726222104496427
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,5120,32,0.0028595555987623003
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,5120,64,0.011039999624093374
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,5120,3584,0.01036088913679123
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,5120,6144,0.020613332589467365
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,4096,65536,0.08574133449130589
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,5120,32,0.011014222270912595
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,5120,4096,0.018351111147138808
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,4096,51200,0.06737333536148071
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,4096,16384,0.027679110566775005
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,4096,65536,0.0709457794825236
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,4096,12288,0.021615111165576514
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,4096,51200,0.05669422282112969
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,4096,10240,0.01906488835811615
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,4096,8192,0.01685333251953125
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,4096,10240,0.023920888702074688
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,4096,7168,0.013739555246300168
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,4096,8192,0.022625777456495497
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,4096,7168,0.02091644373204973
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,4096,5120,0.01089422239197625
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,4096,6144,0.019575110740131803
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,4096,4096,0.010320888625250923
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,4096,3584,0.008926221893893348
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,4096,5120,0.018752889500723947
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,4096,3072,0.00815822184085846
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,4096,4096,0.01704355577627818
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,4096,2560,0.007269333634111617
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,4096,3584,0.016145777371194627
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,4096,2048,0.005924444645643234
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,4096,3072,0.015125332607163323
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,4096,1536,0.004545777622196409
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,4096,2048,0.013840888937314352
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,4096,1024,0.0041831110914548235
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,4096,1536,0.013059555656380124
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,4096,768,0.0038337777886125776
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,4096,1024,0.012101333174440594
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,4096,512,0.0034968890249729156
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,4096,768,0.012121777567598553
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,4096,256,0.0031795555518733132
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,4096,16384,0.026334222820070054
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,4096,12288,0.022608000371191237
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,4096,512,0.011741333537631564
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,4096,128,0.0028728888266616394
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,4096,64,0.00282222218811512
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,4096,32,0.0028088889602157804
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,4096,6144,0.012362666428089142
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,4096,256,0.0110871113008923
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,4096,128,0.011734222372372946
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,4096,64,0.011368888947698804
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,3584,51200,0.06050933069652981
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,3584,16384,0.02422399984465705
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,3584,51200,0.055071999629338585
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,3584,12288,0.019103111492262948
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,3584,16384,0.025732444392310247
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,3584,10240,0.01657777859105004
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,3584,12288,0.021751999855041504
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,4096,2560,0.014436443646748861
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,3584,8192,0.014699555105633207
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,3584,10240,0.0240320000383589
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,3584,7168,0.013563555147912769
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,3584,6144,0.011969777444998423
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,3584,8192,0.02124799953566657
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,3584,5120,0.010384889112578498
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,3584,7168,0.020668443706300523
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,3584,4096,0.009619555539555019
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,3584,6144,0.019318222999572754
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,3584,3584,0.008374222450786168
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,3584,5120,0.018166222506099276
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,3584,3072,0.007693332930405934
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,3584,4096,0.01683288812637329
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,3584,2560,0.006940444310506185
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,3584,3584,0.015822221835454304
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,3584,2048,0.005797333187527127
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,3584,3072,0.014123555686738757
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,3584,1536,0.004515555583768421
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,3584,2560,0.014799111419253878
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,3584,65536,0.0788524415757921
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,3584,1024,0.0038817777401871155
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,4096,32,0.010694222317801582
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,3584,768,0.003546666767862108
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,3584,512,0.003551111039188173
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,3584,65536,0.06886221965154012
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,3584,1536,0.012772444221708508
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,3584,256,0.003165333428316646
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,3584,1024,0.012033777932325998
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,3584,128,0.002834666727317704
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,3584,768,0.012070222033394707
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,3584,64,0.0028400001012616684
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,3584,512,0.012077333198653327
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,3584,256,0.011389333340856763
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,3584,32,0.0028444443725877335
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,3584,128,0.011038222246699862
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,3072,65536,0.06327288680606417
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,3584,32,0.00999022192425198
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,3072,51200,0.05130044288105435
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,3072,16384,0.02068622244728936
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,3072,65536,0.0662977761692471
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,3072,12288,0.01681155628628201
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,3072,51200,0.05299466517236498
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,3072,16384,0.02479822271400028
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,3072,10240,0.01650044487582313
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,3072,8192,0.014864888456132678
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,3072,12288,0.02125777800877889
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,3072,7168,0.012418666647540199
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,3072,10240,0.021968000464969214
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,3072,6144,0.011032000184059143
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,3072,8192,0.020849777592553034
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,3072,5120,0.010017777482668558
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,3072,7168,0.019480889042218525
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,3072,4096,0.009091555244392818
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,3072,6144,0.01811555524667104
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,3072,3584,0.00795733349190818
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,3584,2048,0.013771555489963956
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,3072,4096,0.015391111373901367
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,3072,3072,0.007532444265153673
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,3072,2560,0.006582222051090664
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,3072,3584,0.014807111687130399
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,3072,2048,0.0052151112920708126
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,3072,3072,0.01386755539311303
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,3072,1536,0.004541333350870344
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,3072,2560,0.014097778333557976
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,3072,1024,0.004061333421203825
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,3072,2048,0.013426666458447775
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,3584,64,0.011360888679822287
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,3072,768,0.003547555456558863
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,3072,1536,0.012744888663291931
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,3072,1024,0.012498666842778524
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,3072,256,0.0031635556370019913
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,3072,512,0.011529777612951068
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,3072,128,0.0028391112056043413
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,3072,64,0.002834666727317704
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,3072,256,0.012048888537618848
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,3072,32,0.00282222218811512
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,3072,128,0.011066666907734342
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,2560,65536,0.05713599920272827
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,3072,64,0.011384000380833944
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,3072,32,0.01038933296998342
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,2560,51200,0.045112000571356885
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,2560,16384,0.018910222583346896
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,2560,65536,0.06365244256125556
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,2560,51200,0.05164088805516561
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,2560,12288,0.015446222490734525
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,2560,10240,0.014442667365074158
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,2560,16384,0.02404622236887614
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,2560,8192,0.012728888955381183
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,2560,12288,0.021149333980348375
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,2560,7168,0.012092444631788464
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,2560,10240,0.02257066633966234
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,2560,6144,0.010674667027261523
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,2560,8192,0.01961777773168352
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,2560,5120,0.009992000129487779
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,2560,7168,0.018778666853904724
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,2560,4096,0.008856000171767341
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,3072,512,0.0031946665710873077
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,2560,3584,0.00795199970404307
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,2560,5120,0.01570755574438307
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,3072,768,0.011715555356608497
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,2560,3072,0.00692622239391009
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,2560,4096,0.014840889308187695
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,2560,2560,0.006056889063782162
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,2560,2048,0.005224888937340842
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,2560,3584,0.014482667048772177
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,2560,1536,0.004534222185611725
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,2560,3072,0.01369599997997284
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,2560,1024,0.0038533334930737815
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,2560,2048,0.013074666261672974
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,2560,768,0.0035128887328836652
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,2560,1536,0.012747555143303342
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,2560,512,0.003548444559176763
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,2560,1024,0.011726222104496427
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,2560,256,0.0031840000301599503
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,2560,768,0.011773332953453064
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,2560,128,0.002830222249031067
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,2560,512,0.012065778175989786
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,3072,5120,0.01681066718366411
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,2560,256,0.011048888994587792
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,2560,32,0.0028195555011431375
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,2560,128,0.010747555229398938
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,2560,64,0.011016888750924004
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,2048,65536,0.05265955461396111
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,2560,32,0.010681777364677854
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,2048,51200,0.036947555012173124
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,2048,16384,0.016233777006467182
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,2048,65536,0.06128355529573229
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,2048,51200,0.04997333221965366
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,2048,12288,0.01457244488928053
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,2560,6144,0.01683111157682207
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,2048,10240,0.013203555511103736
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,2048,16384,0.023706666297382776
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,2048,8192,0.012375999655988483
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,2048,12288,0.02058577703105079
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,2048,10240,0.02165688905451033
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,2048,7168,0.01106844428512785
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,2048,6144,0.010306666294733683
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,2048,8192,0.0188719994492001
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,2048,5120,0.009712888962692684
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,2560,2560,0.013816888961527081
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,2048,7168,0.016894222961531747
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,2048,4096,0.008293333152929941
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,2048,6144,0.015736889508035447
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,2048,3584,0.007258666886223688
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,2048,3072,0.006577777779764599
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,2048,5120,0.015076445208655464
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,2048,4096,0.014102222190962898
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,2048,3584,0.014175999495718213
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,2048,2048,0.0052426668504873914
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,2048,3072,0.01368711143732071
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,2048,1536,0.004572444491916233
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,2560,64,0.0028391112056043413
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,2048,2560,0.013358222113715278
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,2048,1024,0.0038844446341196695
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,2048,768,0.0035146665241983202
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,2048,1536,0.012734221915404001
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,2048,1024,0.01148888882663515
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,2048,512,0.003495111233658261
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,2048,256,0.003149333306484752
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,2048,768,0.012067555553383298
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,2048,128,0.0025271111064487034
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,2048,512,0.011761777930789523
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,2048,256,0.01204177737236023
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,2048,64,0.0026462222966882917
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,2048,32,0.0025946667624844448
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,2048,64,0.011363555159833698
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,2048,32,0.010679999987284342
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,1536,65536,0.036580443382263184
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,1536,51200,0.029113776153988306
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,1536,65536,0.05935111310746935
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,1536,16384,0.014104889498816596
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,1536,51200,0.048042668236626514
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,2048,2560,0.005683555371231503
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,1536,12288,0.01276000009642707
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,1536,10240,0.011360000405046674
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,1536,16384,0.02312266661061181
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,1536,8192,0.01015911085738076
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,1536,7168,0.009924444059530893
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,1536,12288,0.02015555567211575
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,1536,10240,0.01886399918132358
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,1536,6144,0.009532444179058075
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,2048,2048,0.012465777496496836
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,1536,5120,0.00888888869020674
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,1536,4096,0.007884444461928474
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,1536,7168,0.01591911084122128
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,1536,3584,0.0069715554515520734
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,1536,6144,0.015499555402331881
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,1536,3072,0.00620977787507905
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,1536,5120,0.014497778481907315
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,1536,2560,0.005604444278611078
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,1536,4096,0.014115555418862237
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,1536,2048,0.005207111024194294
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,1536,3072,0.013468444347381592
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,2048,128,0.011742221812407175
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,1536,1536,0.0045422220395671
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,1536,2560,0.013072888884279462
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,1536,1024,0.0038559999730851916
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,1536,2048,0.01274400038851632
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,1536,768,0.0036657779581016968
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,1536,512,0.003208000005947219
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,1536,1024,0.01163200040658315
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,1536,256,0.0028071111689011254
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,1536,768,0.012056888805495368
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,1536,128,0.0028328889360030494
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,1536,512,0.012068444656001197
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,1536,64,0.002587555597225825
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,1536,256,0.011417778001891242
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,1536,32,0.0025111111915773815
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,1536,128,0.011410666836632622
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,1536,64,0.011704888608720569
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,1536,32,0.009992000129487779
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,1024,51200,0.02145599987771776
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,1024,65536,0.05645333396063911
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,1024,16384,0.011571555501884885
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,1536,8192,0.01683200067943997
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,1024,12288,0.0114702218108707
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,1024,51200,0.046444445848464966
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,1024,10240,0.010117332968446944
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,1024,16384,0.022950222094853718
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,1024,8192,0.009286222358544668
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,1024,12288,0.018930666976504855
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,1536,3584,0.013784888717863293
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,1024,7168,0.00964355551534229
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,1024,10240,0.018239110708236694
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,1024,6144,0.008836444053384993
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,1024,5120,0.007605333295133378
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,1024,7168,0.01585244470172458
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,1024,6144,0.0151235560576121
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,1024,4096,0.007266666326257918
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,1024,3584,0.006928000185224745
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,1536,1536,0.01276000009642707
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,1024,4096,0.01384888920519087
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,1024,3072,0.006221333311663733
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,1024,3584,0.014122666584120857
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,1024,2560,0.005595555735958948
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,1024,3072,0.013204444613721637
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,1024,65536,0.025788444611761305
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,1024,2048,0.007304000357786815
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,1024,2560,0.013428444663683573
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,1024,2048,0.01274577776590983
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,1024,1024,0.004517333375083076
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,1024,1536,0.012431999875439538
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,1024,768,0.0042168887125121225
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,1024,1024,0.012227555943859948
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,1024,768,0.012059555285506778
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,1024,256,0.003362666608558761
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,1024,512,0.011855111353927188
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,1024,8192,0.01647822227742937
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,1024,128,0.0028248888750871024
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,1024,64,0.002558222247494592
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,1024,256,0.01107022249036365
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,1024,32,0.0028373334142896864
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,1024,5120,0.01479200025399526
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,1024,128,0.011367999845080905
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,1024,64,0.011382222175598145
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,768,65536,0.02353422178162469
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,1024,32,0.009679999616410997
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,768,51200,0.01928622192806668
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,768,16384,0.011055111057228513
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,768,12288,0.010676444404655032
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,768,65536,0.055107557111316256
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,768,10240,0.00980977796845966
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,768,51200,0.045082665152019925
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,768,8192,0.008390222158696916
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,768,16384,0.021330666210916307
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,768,7168,0.008949333594905006
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,768,12288,0.018535999788178336
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,768,6144,0.00831911133395301
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,768,10240,0.01757777730623881
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,768,5120,0.00793333351612091
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,768,8192,0.016196444630622864
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,768,4096,0.006974221931563483
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,768,3584,0.0069164443347189165
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,768,6144,0.01514488955338796
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,768,3072,0.006278222219811545
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,768,5120,0.01479822231663598
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,768,2560,0.005636444522274866
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,768,4096,0.013519110778967539
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,768,2048,0.005203555441564984
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,768,3584,0.01404266721672482
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,768,1536,0.004932444542646408
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,768,3072,0.013096888860066732
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,768,1024,0.0041893331540955436
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,768,2560,0.01311466677321328
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,768,768,0.0038364442686239877
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,768,2048,0.012395555774370829
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,768,1536,0.012406222522258759
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,768,512,0.003321777822242843
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,768,256,0.0031511110977994073
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,768,1024,0.011707555916574268
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,768,128,0.002858666703104973
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,768,768,0.011759111450778114
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,768,64,0.002520888836847411
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,768,512,0.01142133358452055
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,768,256,0.011032000184059143
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,768,128,0.010341333018408881
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,768,64,0.011714666253990598
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,512,65536,0.017613333132531907
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,768,32,0.010407999985747868
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,512,51200,0.015962666935390897
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,512,16384,0.010326222413116032
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,512,65536,0.05383911066585117
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,512,12288,0.010000000397364298
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,512,51200,0.04474844535191854
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,512,16384,0.020848888489935134
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,512,10240,0.009016888837019602
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,1024,1536,0.005864000154866113
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,512,8192,0.008292444050312042
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,512,7168,0.008839999636014303
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,512,12288,0.01899111105336083
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,512,10240,0.017162667380438913
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,512,6144,0.008616000413894653
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,512,8192,0.016173332929611206
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,512,5120,0.00793333351612091
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,512,7168,0.015809777710172866
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,512,6144,0.015235554840829639
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,512,5120,0.014479110638300577
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,512,3584,0.0069004446268081665
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,1024,512,0.003510222252872255
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,512,4096,0.013481777575280933
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,512,2560,0.006242666807439592
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,512,3584,0.013751111096805997
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,512,2048,0.005921777751710679
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,512,3072,0.013463111387358772
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,512,1536,0.004287111262480418
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,768,32,0.002817777709828483
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,512,2048,0.012093333734406365
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,512,1024,0.00388355553150177
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,512,1536,0.012455110748608908
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,512,768,0.0034924443397257063
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,512,1024,0.011356444822417365
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,512,512,0.003152888889114062
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,512,512,0.011351111034552256
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,512,256,0.0028604444944196274
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,768,7168,0.015933333171738517
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,512,128,0.0028355556229750314
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,512,256,0.01106844428512785
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,512,64,0.002570666579736604
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,512,4096,0.007258666886223688
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,512,32,0.002793777734041214
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,512,128,0.011553777588738335
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,256,65536,0.017196445001496207
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,512,64,0.010703110860453712
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,512,3072,0.006630222416586346
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,256,51200,0.0144533332851198
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,512,32,0.010341333018408881
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,256,16384,0.009299555586444007
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,256,12288,0.00794400026400884
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,256,65536,0.052151110437181264
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,256,10240,0.007351111206743453
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,512,2560,0.013066666821638743
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,256,16384,0.02070755594306522
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,256,8192,0.0069422221018208405
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,256,12288,0.01850222216712104
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,256,7168,0.006301333506902059
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,256,6144,0.0069191112286514705
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,256,10240,0.017862222260899015
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,256,8192,0.016043555405404832
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,256,5120,0.006664888726340399
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,256,4096,0.0064497776329517365
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,256,7168,0.015487111277050443
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,256,3584,0.006016888966162999
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,256,6144,0.01479022204875946
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,512,768,0.0120666664507654
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,256,3072,0.005609777652555042
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,256,2560,0.005568000177542369
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,256,4096,0.013423999978436364
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,256,3584,0.013758222262064615
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,256,3072,0.013422222601042854
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,256,2560,0.013174222575293647
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,256,1536,0.00453333349691497
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,256,1024,0.004107555581463708
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,256,2048,0.012096888489193387
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,256,768,0.0035386664999855887
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,256,1536,0.01239822225438224
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,256,1024,0.012107555237081317
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,256,768,0.011362666885058085
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,256,256,0.0028613333900769553
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,256,512,0.012044444680213928
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,256,128,0.0025395556456512874
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,256,256,0.01105955574247572
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,256,64,0.002567111204067866
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,256,51200,0.042295111550225147
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,256,128,0.011427555647161273
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,256,32,0.0025395556456512874
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,128,65536,0.014803555276658801
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,256,64,0.010680889089902243
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,128,51200,0.0123848890264829
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,256,32,0.01035377797153261
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,128,16384,0.008009778128729926
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,128,65536,0.04999377661281162
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,128,12288,0.00793688909875022
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,128,51200,0.04071911176045736
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,256,5120,0.014800889624489678
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,128,10240,0.006907555378145642
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,128,16384,0.021278222401936848
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,128,8192,0.006577777779764599
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,256,2048,0.00527555536892679
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,128,7168,0.00628266649113761
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,128,12288,0.018933332628673978
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,128,6144,0.006241777704821692
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,128,10240,0.01787911189926995
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,128,5120,0.0059057776298787855
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,128,8192,0.016192000773217943
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,128,4096,0.005558222118351195
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,128,7168,0.015507555670208402
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,128,3584,0.005786666853560342
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,128,6144,0.01510933372709486
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,128,3072,0.005618666609128316
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,128,5120,0.01479822231663598
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,128,2560,0.005889777921968036
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,128,4096,0.013810666898886362
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,256,512,0.003157333367400699
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,128,3584,0.013778666655222574
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,128,1536,0.004523555437723796
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,128,1024,0.0038515557017591265
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,128,2560,0.013443555268976422
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,128,768,0.0035235554807715942
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,128,2048,0.012460444536474017
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,128,512,0.0031591111587153543
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,128,1536,0.012062222593360476
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,128,256,0.00291377781993813
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,128,1024,0.011047110789351992
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,128,128,0.0028133332315418455
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,128,768,0.012086222569147745
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,128,512,0.011774222056070963
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,128,256,0.011011555790901184
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,128,32,0.002806222273243798
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,128,128,0.010386666489972008
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,64,65536,0.011571555501884885
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,128,64,0.011023110813564725
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,128,32,0.009709333380063375
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,64,51200,0.010495111346244812
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,64,65536,0.05004533463054233
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,64,16384,0.0069288888739215
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,64,51200,0.04072177741262648
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,64,12288,0.006573333508438534
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,64,10240,0.006243555496136348
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,64,16384,0.0209840006298489
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,64,8192,0.006577777779764599
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,64,12288,0.018224888377719455
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,64,7168,0.006225777582989798
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,64,10240,0.016855110724767048
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,128,2048,0.0052488889131281115
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,64,6144,0.005579555614127054
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,64,8192,0.01614488826857673
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,128,3072,0.013415999710559845
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,64,5120,0.005618666609128316
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,64,4096,0.00573511090543535
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,64,3584,0.006214222146405115
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,64,6144,0.01477599971824222
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,64,5120,0.014474666780895658
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,64,3072,0.0052168890833854675
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,64,2560,0.005620444400442972
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,64,3584,0.013741333451535968
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,128,64,0.002522666628162066
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,64,2048,0.005882666756709416
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,64,3072,0.013434666726324292
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,64,1536,0.0042133331298828125
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,64,2560,0.012720888687504662
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,64,1024,0.0038293335172865125
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,64,768,0.00350222239891688
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,64,2048,0.012757333616415659
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,64,1536,0.0123831108212471
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,64,512,0.0031831111345026228
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,64,256,0.0029102222373088202
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,64,768,0.011711999773979187
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,64,128,0.0028008888992998335
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,64,512,0.011724444727102915
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,64,64,0.0028373334142896864
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,64,256,0.0120666664507654
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,64,32,0.002483555633160803
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,64,128,0.011316444310877057
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,32,65536,0.011004444625642566
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,32,51200,0.01038933296998342
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,64,64,0.011065777805116443
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,64,32,0.01038933296998342
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,32,16384,0.0069777775141927935
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,32,12288,0.0069644442862934535
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,32,65536,0.049750222100151904
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,32,51200,0.04073955615361532
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,32,10240,0.006586666736337874
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,32,16384,0.021290666527218286
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,32,8192,0.00627377794848548
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,32,7168,0.006270222365856171
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,64,7168,0.015449777245521545
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,32,10240,0.017276444368892245
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,32,8192,0.01651733285850949
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,32,6144,0.005550222264395819
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,32,5120,0.005527110977305307
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,32,7168,0.015635554989178974
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,32,4096,0.0052373334765434265
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,32,3584,0.005595555735958948
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,32,6144,0.014793778459231058
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,32,5120,0.014730667074521383
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,32,3072,0.0052560000783867305
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,32,4096,0.013802666631009845
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,32,3584,0.013784888717863293
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,32,2048,0.005246222019195557
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,32,3072,0.013440888788965015
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,32,1536,0.004546666724814309
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,32,2560,0.013071111506885953
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,64,1024,0.011090666883521609
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,32,1024,0.0038328886859946777
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,32,768,0.0035093331502543557
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,32,1536,0.012747555143303342
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,32,512,0.0032026666320032547
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,32,1024,0.011696889168686338
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,32,768,0.01108000013563368
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,32,256,0.0029440000653266907
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,32,128,0.00282222218811512
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,32,512,0.011710222396585675
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,32,64,0.0025031111306614345
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,32,256,0.0111191107167138
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,32,128,0.011360888679822287
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,32,32,0.0024888888001441956
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,32,64,0.011383111278216044
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,32,32,0.011030221978823343
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,64,4096,0.013433777623706393
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,65536,16384,0.32167911529541016
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,11,32,2560,0.005791999813583162
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,65536,16384,0.17086399926079643
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,65536,51200,0.4970533582899306
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,32,2048,0.012100444071822695
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,65536,12288,0.24499556753370497
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,65536,12288,0.15148177411821154
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,65536,10240,0.1884240044487847
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,65536,51200,0.9633608924018012
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,65536,7168,0.13354933261871338
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,65536,8192,0.1545004447301229
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,65536,6144,0.11524621645609538
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,65536,10240,0.13211022482977972
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,65536,7168,0.10511555274327596
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,65536,8192,0.1367031070921156
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,65536,6144,0.09260177612304688
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,11,32,12288,0.018536888890796237
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,65536,3584,0.06923466920852661
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,65536,5120,0.08061155345704821
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,65536,4096,0.08129688766267565
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,65536,3072,0.05992088715235392
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,65536,4096,0.06856799787945218
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,65536,2560,0.050605333513683744
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,65536,5120,0.09715288877487183
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,65536,2048,0.04184000028504265
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,65536,3072,0.06057422028647529
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,65536,1024,0.024029332730505202
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,65536,2560,0.04706844356324938
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,65536,2048,0.04029777646064758
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,65536,768,0.018580444984965853
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,65536,512,0.013432888521088494
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,65536,1536,0.0343502230114407
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,65536,1024,0.028177777926127117
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,65536,256,0.008263111114501953
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,65536,768,0.02325244413481818
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,65536,128,0.006596444381607904
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,65536,512,0.018032888571421306
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,65536,256,0.016951999730534024
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,65536,128,0.013803555733627744
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,65536,32,0.0059368887709246735
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,65536,64,0.014430221584108142
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,65536,32,0.015861334072219003
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,65536,3584,0.06458399693171184
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,51200,65536,0.5252898004319932
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,65536,1536,0.03240711159176297
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,51200,51200,0.8225822448730469
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,51200,16384,0.13865333133273655
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,51200,16384,0.2781146632300483
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,65536,64,0.005596444424655702
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,51200,51200,0.40007466740078396
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,51200,12288,0.20264266596900093
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,51200,10240,0.17608888943990073
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,51200,12288,0.14789599842495388
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,51200,8192,0.140611555841234
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,51200,10240,0.10584355725182427
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,51200,7168,0.12307466400994195
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,51200,6144,0.10627022054460313
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,51200,7168,0.08343911170959473
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,51200,6144,0.0747493306795756
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,51200,5120,0.08887466457155015
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,51200,4096,0.0731031099955241
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,51200,8192,0.09691022502051459
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,51200,5120,0.06407022476196289
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,51200,3584,0.06405866808361478
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,51200,4096,0.05753511190414429
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,51200,3072,0.055493334929148354
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,51200,3584,0.054767999384138316
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,51200,2048,0.037928889195124306
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,51200,3072,0.04582133226924472
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,51200,1536,0.02949955397182041
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,51200,2560,0.040377779139412776
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,51200,2048,0.03349599904484219
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,51200,768,0.01603822244538201
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,51200,65536,1.0904613071017795
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,51200,1024,0.024079999989933435
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,51200,512,0.011552000211344825
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,51200,1536,0.03045155604680379
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,51200,768,0.02095199955834283
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,51200,128,0.0041982221106688184
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,51200,512,0.01776977711253696
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,51200,64,0.003543111185232798
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,51200,256,0.01512977812025282
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,51200,32,0.0035084444615576
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,51200,128,0.012487110992272695
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,51200,64,0.01481066644191742
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,51200,256,0.00758844448460473
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,51200,32,0.014567111929257711
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,16384,65536,0.31800444920857746
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,16384,51200,0.2503902117411296
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,16384,65536,0.18610666857825386
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,51200,2560,0.04679377873738607
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,16384,16384,0.09056799941592747
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,16384,12288,0.07067644596099854
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,16384,10240,0.05410933494567871
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,51200,1024,0.021199999584092036
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,16384,16384,0.05632177988688151
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,16384,12288,0.053512000375323825
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,16384,7168,0.03806311223242018
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,16384,6144,0.03324888812171088
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,16384,8192,0.04366755485534668
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,16384,7168,0.03781333234575059
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,16384,5120,0.029096000724368628
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,16384,4096,0.024319999747806128
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,16384,6144,0.03619199991226196
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,16384,5120,0.031158222092522517
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,16384,3584,0.020946666598320007
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,16384,3072,0.018765333626005385
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,16384,4096,0.026550221774313185
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,16384,2560,0.01590755581855774
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,16384,3584,0.025827555192841425
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,16384,3072,0.0247715562582016
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,16384,2048,0.013399110900031196
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,16384,2560,0.022504000200165644
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,16384,1536,0.010774222513039907
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,16384,2048,0.019111111760139465
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,16384,1024,0.008360889222886827
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,16384,51200,0.14103910658094618
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,16384,1536,0.017872888180944655
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,16384,768,0.0069297779765393995
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,16384,512,0.005158222383923001
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,16384,1024,0.015241778559154935
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,16384,256,0.0033866665843460294
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,16384,768,0.014451555079884
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,16384,128,0.0031795555518733132
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,16384,64,0.002875555513633622
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,16384,512,0.012862222062216865
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,16384,8192,0.04541777902179294
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,16384,32,0.002987555538614591
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,16384,256,0.012057777908113269
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,16384,128,0.011392888923486074
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,16384,10240,0.05016977919472588
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,16384,64,0.011711111499203576
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,12288,16384,0.06680355469385783
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,12288,65536,0.25395822525024414
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,12288,51200,0.19900800122155082
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,16384,32,0.0114702218108707
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,12288,12288,0.0524453322092692
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,12288,51200,0.12211288346184625
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,12288,10240,0.04499288731151157
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,12288,16384,0.04998133248753018
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,12288,8192,0.036905778778923884
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,12288,12288,0.05398311217625936
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,12288,7168,0.03262133399645487
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,12288,6144,0.02903288933965895
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,12288,8192,0.03844088978237576
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,12288,10240,0.04513422316975064
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,12288,7168,0.034287999073664345
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,12288,4096,0.020246222615242004
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,12288,3584,0.01759022143152025
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,12288,5120,0.027574222948816087
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,12288,3072,0.015524443652894763
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,12288,4096,0.02586311101913452
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,12288,2560,0.013088000317414602
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,12288,3584,0.02485688858562046
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,12288,2048,0.011333333121405708
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,12288,3072,0.021887999441888597
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,12288,1536,0.009600888523790572
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,12288,2560,0.020284444093704224
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,12288,2048,0.01791200041770935
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,12288,1024,0.007639110916190677
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,12288,768,0.006495111104514863
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,12288,1536,0.01715555621518029
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,12288,512,0.004576000074545543
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,12288,1024,0.014441778262456259
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,12288,256,0.003510222252872255
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,12288,768,0.013942221800486246
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,12288,128,0.0031973332580592898
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,12288,512,0.01240799989965227
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,12288,64,0.003162666741344664
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,12288,256,0.011720000041855706
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,12288,32,0.0032213332338465583
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,12288,64,0.011375111010339526
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,12288,32,0.011714666253990598
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,12288,5120,0.025366221865018208
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,12288,6144,0.034985777404573225
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,10240,65536,0.21770932939317492
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,10240,16384,0.059099555015563965
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,10240,51200,0.17304710547129312
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,10240,65536,0.1507893270916409
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,10240,12288,0.046741333272722035
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,10240,51200,0.11775378386179607
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,10240,10240,0.03830044468243917
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,10240,16384,0.04771733283996582
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,10240,12288,0.04379377762476603
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,10240,10240,0.03973599937227037
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,10240,8192,0.032115555471844144
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,10240,6144,0.026018665896521673
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,10240,8192,0.033095998896492854
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,10240,5120,0.022496889034907024
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,10240,7168,0.03150399857097202
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,10240,4096,0.018227555685573153
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,12288,65536,0.15666311317019993
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,10240,6144,0.028312000963422988
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,10240,3584,0.016125332978036668
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,10240,5120,0.024688000480333965
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,10240,3072,0.014292443792025248
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,12288,128,0.011710222396585675
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,10240,2560,0.012320888539155325
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,10240,2048,0.010954666468832227
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,10240,3584,0.021448888712459143
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,10240,3072,0.019537778364287484
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,10240,1536,0.009116444322797988
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,10240,2560,0.018589332699775696
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,10240,1024,0.007602666815121968
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,10240,768,0.0058666666348775225
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,10240,2048,0.017283555534150865
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,10240,1536,0.01551999979548984
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,10240,512,0.004879999905824661
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,10240,1024,0.014105778601434497
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,10240,768,0.01315111087428199
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,10240,128,0.0032302221904198327
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,10240,512,0.012080888781282636
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,10240,256,0.01203555530971951
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,10240,64,0.00286311118139161
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,10240,32,0.003154666680428717
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,10240,128,0.010689777632554373
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,10240,64,0.012392889294359418
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,10240,7168,0.029213332467608984
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,10240,32,0.01071466671095954
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,8192,65536,0.1739671097861396
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,8192,51200,0.13077510727776423
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,8192,16384,0.04561511013242933
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,8192,65536,0.10134755240546332
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,8192,51200,0.07910311222076416
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,8192,12288,0.0330062210559845
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,8192,10240,0.027456889549891155
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,8192,8192,0.02500533395343357
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,8192,12288,0.03715288970205519
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,8192,16384,0.03606133328543769
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,10240,4096,0.022663111488024395
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,8192,7168,0.021779555413458083
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,8192,6144,0.018904000520706177
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,8192,10240,0.03140711122088962
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,8192,5120,0.016533333394262526
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,8192,8192,0.026918222506841023
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,8192,4096,0.014416888356208801
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,8192,7168,0.025239111648665533
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,8192,3584,0.012461333639091916
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,8192,6144,0.023365333676338196
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,8192,3072,0.011511999699804517
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,8192,5120,0.021306667062971327
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,8192,2560,0.009911110831631554
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,10240,256,0.0038488888078265717
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,8192,3584,0.01923288901646932
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,8192,2048,0.008652444514963362
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,8192,1536,0.007306666837798224
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,8192,3072,0.017846221725145977
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,8192,2560,0.01648000048266517
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,8192,768,0.004574222283230888
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,8192,2048,0.015178667174445258
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,8192,512,0.0038151111867692736
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,8192,1536,0.014135999812020196
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,8192,1024,0.013417777915795645
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,8192,256,0.0031946665710873077
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,8192,768,0.012511110968059964
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,8192,128,0.0028737777223189673
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,8192,64,0.0028604444944196274
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,8192,512,0.011699555648697747
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,8192,32,0.0028613333900769553
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,8192,256,0.012105777859687805
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,8192,128,0.010703999963071613
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,8192,64,0.012065778175989786
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,8192,32,0.01070844464831882
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,7168,65536,0.1478817727830675
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,7168,51200,0.11656710836622451
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,7168,16384,0.04174933168623182
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,7168,65536,0.09321422047085232
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,7168,12288,0.03290311164326138
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,7168,10240,0.028146667612923518
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,7168,16384,0.03435644507408142
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,7168,12288,0.035888890425364174
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,7168,8192,0.021799110703998145
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,7168,7168,0.020558221472634208
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,7168,10240,0.030702223380406696
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,7168,8192,0.026153778036435444
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,8192,4096,0.01957155598534478
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,7168,5120,0.015420445137553744
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,7168,7168,0.02439111140039232
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,7168,4096,0.013263111313184103
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,8192,1024,0.005537777725193236
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,7168,6144,0.02251111136542426
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,7168,3584,0.01203555530971951
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,7168,5120,0.02064622276359134
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,7168,3072,0.010655110908879174
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,7168,2560,0.009694221946928237
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,7168,4096,0.019644444187482197
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,7168,2048,0.008310221963458592
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,7168,3584,0.018225777480337355
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,7168,3072,0.017491555876202054
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,7168,1536,0.007241778075695038
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,7168,1024,0.005162666655249066
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,7168,2560,0.016140444411171805
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,7168,2048,0.014745778507656522
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,7168,768,0.004182222402758068
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,7168,512,0.0038408889538711975
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,7168,1536,0.013754666679435305
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,7168,256,0.0032097777972618737
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,7168,1024,0.012711111042234631
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,7168,128,0.0031679999083280563
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,7168,768,0.012773333324326409
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,7168,512,0.012058667010731168
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,7168,64,0.002809777855873108
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,7168,32,0.0028684443483750024
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,7168,128,0.010694222317801582
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,7168,51200,0.07239733139673869
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,7168,64,0.011378666592968835
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,7168,32,0.011431111229790581
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,6144,65536,0.1226195494333903
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,6144,51200,0.0975688894589742
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,6144,65536,0.08501511149936253
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,6144,16384,0.03559733430544535
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,6144,12288,0.028675556182861328
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,7168,6144,0.018127111925019156
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,6144,10240,0.024658666716681585
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,6144,16384,0.03214222192764282
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,6144,8192,0.02128355536195967
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,6144,12288,0.030692444907294378
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,6144,7168,0.019066666563351948
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,6144,10240,0.02787644333309597
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,6144,6144,0.016937777400016785
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,6144,8192,0.025369778275489807
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,6144,5120,0.015452444553375244
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,6144,7168,0.022635555929607813
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,6144,4096,0.011415111521879831
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,6144,6144,0.0226248883538776
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,6144,3584,0.010384889112578498
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,6144,5120,0.020225778222084045
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,6144,3072,0.010320888625250923
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,6144,4096,0.01830933325820499
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,6144,3584,0.01841600073708428
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,7168,256,0.011401777466138205
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,6144,3072,0.016977777083714802
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,6144,2048,0.00793511089351442
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,6144,1536,0.006734222173690796
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,6144,2560,0.015485333071814643
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,6144,1024,0.004581333448489507
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,6144,2048,0.013988445202509562
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,6144,768,0.004152889053026835
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,6144,1536,0.013396444420019785
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,6144,512,0.003871110992299186
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,6144,1024,0.012798222402731577
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,6144,51200,0.06604622470008002
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,6144,256,0.0031519999934567344
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,6144,768,0.01240355521440506
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,6144,128,0.0028906667398081887
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,6144,512,0.011095999843544431
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,6144,64,0.0028275555620590844
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,6144,32,0.0028311111446883944
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,6144,256,0.011751111182901593
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,6144,128,0.01072799993885888
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,6144,64,0.01071466671095954
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,6144,32,0.0107004443804423
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,5120,65536,0.10680088731977676
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,5120,51200,0.08527288834253947
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,5120,16384,0.031888888941870794
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,5120,65536,0.07778577672110663
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,5120,12288,0.025798221429189045
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,5120,51200,0.06054844458897909
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,5120,16384,0.029425776667065088
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,5120,10240,0.02218577762444814
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,5120,8192,0.019859555694792006
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,5120,12288,0.028408000866572063
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,5120,7168,0.01737511157989502
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,5120,6144,0.015831111205948722
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,5120,10240,0.02606311109330919
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,6144,2560,0.008971555365456475
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,5120,5120,0.013861333330472311
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,5120,4096,0.01202488856183158
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,5120,7168,0.022310222188631695
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,5120,3584,0.010528888967302112
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,5120,3072,0.009352888498041365
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,5120,6144,0.021149333980348375
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,5120,5120,0.019223110543357003
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,5120,2560,0.00849866701496972
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,5120,2048,0.0073902226156658595
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,5120,3584,0.01756000022093455
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,5120,3072,0.0162462227874332
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,5120,1536,0.0058755555914507965
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,5120,2560,0.014476444986131458
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,5120,1024,0.004552888787455029
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,5120,768,0.004218666503826777
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,5120,2048,0.014172444740931192
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,5120,512,0.003524444583389494
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,5120,1536,0.013082666529549493
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,5120,256,0.003154666680428717
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,5120,768,0.012426666915416718
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,5120,128,0.0028231110837724474
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,5120,512,0.012078222301271228
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,5120,64,0.002516444358560774
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,5120,256,0.011359111302428775
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,5120,32,0.002814222127199173
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,5120,128,0.010679110884666443
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,5120,64,0.011718221836619906
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,4096,65536,0.08578399817148845
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,5120,32,0.01033333357837465
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,4096,51200,0.06768622001012166
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,4096,16384,0.027678221464157104
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,4096,65536,0.07154755459891425
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,4096,51200,0.05630577935112847
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,4096,12288,0.021672000487645466
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,4096,10240,0.01923822197649214
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,5120,8192,0.02551288902759552
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,4096,16384,0.025807999902301367
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,4096,8192,0.017136888371573556
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,4096,12288,0.027451554934183758
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,4096,7168,0.013975110318925647
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,4096,10240,0.025217778152889673
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,5120,4096,0.018069333500332303
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,4096,6144,0.012373333175977072
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,4096,5120,0.010890666809346942
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,4096,8192,0.022662222385406494
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,4096,4096,0.010035555395815108
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,4096,6144,0.020250666472646926
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,4096,3584,0.008861333131790161
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,4096,5120,0.018197332819302876
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,4096,3072,0.008120888637171851
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,5120,1024,0.012795555922720166
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,4096,2560,0.007298666569921706
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,4096,3584,0.016395555602179635
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,4096,2048,0.006256888724035687
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,4096,3072,0.014803555276658801
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,4096,1536,0.004791999856630961
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,4096,2560,0.0141004439857271
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,4096,1024,0.0038399998512532976
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,4096,2048,0.014108444253603617
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,4096,768,0.003519111209445529
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,4096,1536,0.01312444441848331
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,4096,512,0.003506666670242945
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,4096,1024,0.01239822225438224
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,4096,256,0.0028799999919202593
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,4096,768,0.012413333687517377
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,4096,128,0.002855111120475663
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,4096,256,0.01204177737236023
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,4096,64,0.002817777709828483
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,4096,128,0.011570666399266986
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,4096,32,0.0024906665914588505
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,4096,64,0.011085333095656501
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,4096,32,0.01071200023094813
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,4096,7168,0.02095199955834283
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,3584,65536,0.07768799861272176
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,3584,51200,0.06036444505055746
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,4096,4096,0.017272889614105225
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,3584,65536,0.06881688700781928
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,3584,51200,0.05483733283148872
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,3584,12288,0.01907911068863339
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,3584,10240,0.0165955556763543
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,3584,16384,0.02490666674243079
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,3584,12288,0.02637600070900387
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,3584,10240,0.024529778295093115
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,3584,7168,0.013754666679435305
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,3584,8192,0.02199555602338579
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,3584,6144,0.012084444363911947
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,3584,7168,0.020615999897321064
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,3584,5120,0.010570666856235929
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,3584,6144,0.020233778489960563
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,3584,4096,0.009939555492666032
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,3584,3584,0.008608000146018134
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,3584,4096,0.016157334049542744
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,3584,3072,0.00793599999613232
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,3584,3584,0.016168889072206285
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,3584,2560,0.006919999917348226
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,3584,3072,0.014644443988800049
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,3584,2048,0.005568000177542369
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,3584,16384,0.023631999890009563
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,3584,1536,0.0046977777447965415
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,3584,2048,0.01309511148267322
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,3584,1024,0.003903999924659729
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,3584,1536,0.012448888685968188
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,3584,8192,0.01459822224246131
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,3584,768,0.0038497779104444715
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,3584,512,0.0032622222271230486
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,3584,1024,0.012053333222866058
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,3584,256,0.003173333282272021
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,3584,768,0.012079111403889127
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,3584,512,0.011028444601429833
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,3584,256,0.011041777829329172
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,4096,512,0.011766222616036734
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,3584,64,0.0028168888141711554
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,3584,32,0.0028133332315418455
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,3584,128,0.011034666664070554
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,3584,5120,0.018203554881943595
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,3584,64,0.011724444727102915
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,3072,65536,0.06332266992992826
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,3584,32,0.0107004443804423
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,3072,51200,0.05059555504057142
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,3072,16384,0.02077866593996684
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,3072,12288,0.016979555288950603
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,3072,65536,0.0662062234348721
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,3072,51200,0.052998221582836576
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,3072,10240,0.016893333858913846
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,3072,16384,0.024738666084077623
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,3072,8192,0.014931556251313953
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,3072,12288,0.026572444372706946
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,3072,7168,0.012678222523795234
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,3584,2560,0.013825777504179211
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,3072,6144,0.011041777829329172
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,3072,5120,0.010159999959998662
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,3072,8192,0.020995555652512446
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,3072,7168,0.019560888409614563
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,3072,4096,0.009276444713274637
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,3072,6144,0.018755555152893066
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,3072,3584,0.0081377774477005
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,3072,3072,0.007607111500369177
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,3072,5120,0.017014222012625802
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,3072,2560,0.006310222049554189
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,3072,4096,0.015107555521859063
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,3072,2048,0.005393777870469623
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,3072,3072,0.014098667436175875
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,3072,1536,0.004562666846646203
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,3584,128,0.0028328889360030494
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,3072,2048,0.012785777449607849
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,3072,1024,0.003879111260175705
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,3072,1536,0.012475555141766867
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,3072,768,0.0038408889538711975
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,3072,1024,0.012054222325483957
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,3072,512,0.00350222239891688
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,3072,768,0.012073777616024017
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,3072,256,0.0031582222630580268
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,3072,512,0.011416888899273343
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,3072,128,0.0028159999185138275
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,3072,256,0.01125955581665039
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,3072,64,0.0028275555620590844
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,3072,128,0.010680889089902243
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,3072,10240,0.02221244408024682
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,3072,32,0.0025271111064487034
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,3072,64,0.010925333533022137
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,2560,65536,0.05758577585220337
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,3072,32,0.01107377807299296
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,2560,51200,0.04495733314090305
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,2560,16384,0.01884355478816562
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,2560,65536,0.06362222300635444
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,3072,3584,0.015122666954994202
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,2560,12288,0.015440000428093804
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,2560,51200,0.05136977632840475
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,2560,10240,0.014148443937301636
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,3072,2560,0.013432888521088494
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,2560,8192,0.012783110969596438
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,2560,16384,0.024000888069470722
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,2560,7168,0.012016889121797351
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,2560,12288,0.02331466641690996
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,2560,6144,0.011001778145631155
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,2560,5120,0.010317333042621613
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,2560,10240,0.022039999564488728
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,2560,4096,0.008960888617568547
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,2560,8192,0.01960711181163788
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,2560,3584,0.007853333320882585
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,2560,3072,0.006955555743641323
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,2560,7168,0.018412444326612685
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,2560,6144,0.01718488832314809
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,2560,5120,0.015684444043371413
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,2560,2048,0.0052177777720822235
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,2560,3584,0.014192000031471252
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,2560,1536,0.004466666529575984
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,2560,3072,0.013739555246300168
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,2560,1024,0.003859555555714501
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,2560,2560,0.01310755560795466
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,2560,2048,0.012958221965365939
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,2560,512,0.0034968890249729156
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,2560,1536,0.012476444244384766
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,2560,1024,0.011705777711338468
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,2560,256,0.0031635556370019913
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,2560,768,0.011704888608720569
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,2560,512,0.011016888750924004
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,2560,256,0.011152889165613385
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,2560,128,0.01038755559258991
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,2560,32,0.0028248888750871024
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,2560,64,0.010781333678298526
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,2048,65536,0.05184622274504768
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,2560,32,0.010391111175219217
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,2048,51200,0.036728888750076294
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,2048,65536,0.0613973339398702
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,2048,16384,0.016515556308958266
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,2048,51200,0.04966400067011515
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,2048,12288,0.014709333578745524
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,2048,16384,0.023782221807373896
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,2560,2560,0.005936000082227919
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,2048,10240,0.013405332962671915
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,2560,4096,0.014783110883500842
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,2048,12288,0.023597333166334365
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,2048,8192,0.012299555871221753
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,2048,7168,0.011064888702498542
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,2048,6144,0.010288000106811523
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,2048,10240,0.020125332805845473
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,2048,8192,0.019167999426523846
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,2048,7168,0.01703733371363746
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,2048,4096,0.008208889100286696
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,2048,6144,0.015226667126019796
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,2560,128,0.002814222127199173
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,2048,3584,0.007304000357786815
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,2048,5120,0.014961777461899651
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,2048,3072,0.006243555496136348
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,2560,64,0.0028159999185138275
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,2048,2560,0.00572533326016532
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,2048,2048,0.004913777940803104
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,2048,3584,0.013566222455766467
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,2048,1536,0.004524444540341695
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,2048,3072,0.01366666704416275
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,2048,1024,0.0038817777401871155
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,2048,2560,0.013086222112178802
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,2048,2048,0.012409778104888068
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,2048,1536,0.012447111308574677
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,2048,512,0.003177777760558658
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,2048,1024,0.012071111136012606
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,2048,256,0.003014222201373842
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,2048,512,0.011729777687125735
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,2048,128,0.0028408887899584244
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,2048,256,0.011774222056070963
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,2048,64,0.002536000063021978
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,2048,128,0.011078221930397881
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,2048,32,0.00282222218811512
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,2048,64,0.01145333300034205
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,2560,768,0.003551111039188173
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,2048,5120,0.009662222531106737
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,2048,32,0.011028444601429833
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,1536,65536,0.0362026658323076
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,1536,51200,0.02915289004643758
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,1536,16384,0.014081777797804939
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,1536,65536,0.05884266561932034
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,1536,51200,0.04833155539300707
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,2048,4096,0.014191110928853353
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,1536,12288,0.012674666941165924
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,1536,10240,0.01127199994193183
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,1536,16384,0.02330488959948222
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,1536,8192,0.010505778094132742
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,1536,7168,0.009687999884287516
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,1536,12288,0.02127555509408315
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,1536,10240,0.019401777121755812
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,1536,6144,0.009871111147933537
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,1536,8192,0.01680444512102339
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,1536,5120,0.008519111408127679
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,1536,7168,0.015917332635985482
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,1536,4096,0.007611555357774098
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,1536,3584,0.006960888703664144
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,2048,768,0.011727111207114326
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,1536,6144,0.01551822159025404
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,1536,3072,0.006287999865081575
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,1536,5120,0.01475822263293796
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,1536,2560,0.005882666756709416
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,1536,4096,0.013961777091026306
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,1536,2048,0.0052284445199701525
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,1536,3584,0.013775111072593264
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,1536,1536,0.004527111020353106
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,1536,3072,0.013755555782053204
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,1536,1024,0.003951999876234266
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,1536,2560,0.013106666505336761
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,1536,768,0.0035075553589397003
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,1536,2048,0.012729778057999082
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,1536,512,0.003165333428316646
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,1536,256,0.003162666741344664
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,1536,1024,0.012103999654452005
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,1536,128,0.0028355556229750314
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,1536,768,0.012078222301271228
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,1536,512,0.011022222538789114
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,1536,64,0.0028124445428450904
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,1536,32,0.0028391112056043413
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,1536,256,0.01069777790043089
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,1024,65536,0.025996444953812495
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,1536,64,0.01070666644308302
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,1536,32,0.011071999867757162
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,1024,51200,0.021677333447668288
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,1024,16384,0.011898666620254517
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,1024,65536,0.05594311157862345
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,1024,12288,0.011689778003427716
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,1024,51200,0.045187556081347995
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,1024,10240,0.010384889112578498
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,1024,16384,0.021631111701329548
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,1024,8192,0.009076444639099969
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,2048,768,0.0036319999231232535
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,1024,12288,0.019885333047972787
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,1024,7168,0.009663110805882348
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,1024,10240,0.017616000440385606
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,1024,6144,0.008976889153321585
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,1024,8192,0.016184889607959323
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,1024,5120,0.007928888830873702
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,1024,4096,0.007305777735180325
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,1024,6144,0.015476443701320224
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,1024,3584,0.00674044465025266
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,1024,4096,0.013787555197874704
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,1024,3072,0.00628977765639623
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,1024,3584,0.013432888521088494
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,1024,2560,0.005884444548024072
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,1024,3072,0.013167999684810638
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,1024,2048,0.006638222270541721
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,1024,2560,0.013109332985348172
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,1024,1536,0.0052488889131281115
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,1536,128,0.011436444189813403
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,1024,2048,0.012617777619096967
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,1024,1536,0.012423111332787408
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,1024,768,0.0038942222793896994
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,1024,1024,0.011375111010339526
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,1024,512,0.0038453332251972626
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,1024,768,0.012091555529170565
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,1024,256,0.003152888889114062
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,1024,512,0.011021333436171213
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,1024,128,0.0028533333291610083
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,1024,256,0.011386666860845355
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,1024,7168,0.01575999955336253
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,1024,64,0.002519999941190084
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,1024,32,0.0028151110228565005
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,1024,128,0.011020444333553314
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,1024,5120,0.014142221874660917
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,768,65536,0.023344889283180237
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,1024,64,0.010739555789364709
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,768,51200,0.01928711103068458
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,1024,32,0.011071110765139261
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,768,16384,0.01132266637351778
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,768,12288,0.010943111446168689
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,1536,1536,0.012223111258612739
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,768,51200,0.04449866546524895
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,768,16384,0.021262221866183813
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,768,8192,0.008340444829728868
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,768,10240,0.017303999927308824
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,1024,1024,0.004521777646409141
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,768,7168,0.009333333207501305
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,768,8192,0.016160888804329764
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,768,6144,0.008624888956546783
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,768,7168,0.016158221496476066
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,768,5120,0.008006222546100616
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,768,4096,0.007323555648326874
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,768,6144,0.014827556080288358
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,768,3584,0.0069475554757648045
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,768,5120,0.01444355481200748
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,768,3072,0.006238222122192383
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,768,4096,0.013991110854678683
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,768,2560,0.00556355549229516
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,768,3584,0.013430222041077085
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,768,2048,0.005207111024194294
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,768,3072,0.01312444441848331
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,768,1536,0.004925333377387789
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,768,2560,0.013091555900043912
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,768,1024,0.0041946665280395085
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,768,2048,0.01239822225438224
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,768,768,0.0038453332251972626
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,768,1536,0.012068444656001197
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,768,65536,0.05484088924196032
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,768,512,0.0035111109415690103
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,768,10240,0.00941955546538035
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,768,1024,0.012169777519173093
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,768,256,0.0031759999692440033
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,768,128,0.0028204443968004654
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,768,768,0.011711111499203576
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,768,64,0.0028284444577164124
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,768,12288,0.018552889426549275
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,768,512,0.011053333679835001
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,768,32,0.0027093332674768236
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,768,256,0.01074222226937612
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,512,65536,0.01720711092154185
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,768,128,0.010371555884679159
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,512,51200,0.0158924443854226
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,768,64,0.010701333483060202
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,512,16384,0.010404444403118556
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,768,32,0.009705777797434065
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,512,12288,0.010041777458455827
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,512,10240,0.008952000074916417
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,512,51200,0.043824000491036304
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,512,8192,0.008264000217119852
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,512,16384,0.020977778567208186
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,512,7168,0.008997333546479544
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,512,12288,0.018414222531848483
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,512,6144,0.008294222255547842
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,512,10240,0.01721333298418257
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,512,5120,0.00794933322403166
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,512,8192,0.016179554992251925
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,512,4096,0.007275555696752336
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,512,7168,0.015807999504937064
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,512,6144,0.014803555276658801
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,512,5120,0.01443199978934394
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,512,4096,0.013743999931547375
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,512,2560,0.0062773335311147906
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,512,3072,0.013087111214796701
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,512,2048,0.005881777654091517
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,512,2560,0.012421333127551608
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,512,1536,0.004511111312442356
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,512,2048,0.012114666402339935
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,512,1024,0.003822222352027893
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,512,1536,0.012025777664449481
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,512,768,0.0034968890249729156
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,512,1024,0.011416888899273343
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,512,512,0.0032231110251612137
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,512,768,0.011711111499203576
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,512,256,0.002924444360865487
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,512,512,0.011015111373530494
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,512,128,0.002809777855873108
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,512,256,0.01071733319097095
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,512,64,0.002524444419476721
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,512,128,0.010056888891590966
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,512,3584,0.006919999917348226
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,512,64,0.010661332971519895
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,512,3072,0.006257777826653586
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,256,65536,0.017151999804708693
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,256,51200,0.014640889234013028
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,512,3584,0.013457777599493662
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,256,16384,0.009324444664849175
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,256,65536,0.051870223548677236
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,256,12288,0.007996444072988298
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,256,51200,0.041401777002546526
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,256,10240,0.007364444434642792
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,256,16384,0.02092444399992625
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,256,8192,0.0069520001610120135
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,256,12288,0.018365333477656048
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,256,7168,0.006607111129495833
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,256,10240,0.01748533381356133
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,256,6144,0.006970666348934174
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,256,8192,0.016142222616407607
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,256,5120,0.006597333484225803
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,256,7168,0.015484443969196744
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,256,4096,0.005942222144868638
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,256,6144,0.015287111202875773
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,256,3584,0.006234666539563074
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,256,5120,0.014444443914625378
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,256,3072,0.005550222264395819
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,512,65536,0.05341955688264635
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,256,4096,0.013460444079505073
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,256,3584,0.013111111190583972
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,256,3072,0.013420444395807056
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,256,2048,0.00590133335855272
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,512,32,0.0025271111064487034
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,256,2560,0.012404444317022959
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,256,1536,0.004535111288229625
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,256,1024,0.0038373333712418876
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,256,2048,0.012857777376969656
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,512,32,0.009649777577983009
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,256,1536,0.012038222617573209
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,256,768,0.0035582222044467926
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,256,512,0.0032026666320032547
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,256,256,0.00286666676402092
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,256,1024,0.011376000112957425
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,256,128,0.002838222309947014
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,256,768,0.011725333001878528
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,256,512,0.012042666474978128
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,256,64,0.0028204443968004654
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,256,256,0.010812444819344414
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,256,32,0.002479111154874166
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,128,65536,0.014712888333532544
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,256,128,0.010064000056849586
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,128,51200,0.012411555482281579
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,256,64,0.01069866700304879
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,128,16384,0.007958222594526079
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,128,65536,0.04935377836227417
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,128,12288,0.00758844448460473
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,128,51200,0.04079200161827935
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,128,16384,0.020638222495714825
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,128,10240,0.006631111105283101
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,128,8192,0.006640888750553131
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,128,12288,0.018532445033391316
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,128,7168,0.006249777972698212
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,128,10240,0.017495999733606975
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,256,2560,0.005604444278611078
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,128,8192,0.015857777661747403
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,128,5120,0.0058959999846087555
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,128,7168,0.015791111522250705
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,128,6144,0.01443733274936676
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,128,5120,0.014141332772043018
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,128,3584,0.005893333504597346
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,128,4096,0.013470222552617392
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,128,3072,0.005264889034960005
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,128,3584,0.013092444174819522
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,128,2560,0.005601777798599667
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,128,3072,0.013071999781661563
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,128,2048,0.005558222118351195
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,128,2560,0.012516444755925072
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,128,1536,0.004555555681387584
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,256,32,0.01036622209681405
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,128,2048,0.01203644441233741
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,128,1024,0.003858666867017746
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,128,768,0.00332266671790017
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,128,1536,0.011758222348160215
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,128,512,0.0032115555885765287
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,128,1024,0.011362666885058085
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,128,256,0.0028728888266616394
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,128,768,0.011754666765530905
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,128,128,0.0028693332440323303
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,128,512,0.0107342220014996
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,128,64,0.002514666567246119
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,128,6144,0.006020444548792309
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,128,32,0.002479111154874166
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,128,128,0.011393778026103973
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,64,65536,0.011420444481902652
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,64,51200,0.010407999985747868
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,128,4096,0.005576000031497743
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,128,32,0.009993777506881291
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,64,16384,0.0069422221018208405
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,64,65536,0.04996533195177714
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,64,51200,0.04144355654716492
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,64,10240,0.006639110959238476
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,64,12288,0.018586667047606576
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,64,8192,0.006576889091067844
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,64,10240,0.01757955551147461
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,64,7168,0.006270222365856171
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,64,8192,0.016199999385409884
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,64,6144,0.006246222390068903
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,64,7168,0.015885333220163982
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,64,5120,0.005962666538026597
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,64,6144,0.015126221709781222
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,64,4096,0.005560889012283749
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,64,5120,0.0148044443792767
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,64,3584,0.005927111125654644
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,64,4096,0.013798221945762634
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,128,256,0.010732444624106089
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,64,3072,0.005548444473081165
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,64,3584,0.014006222287813822
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,128,64,0.010524444282054901
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,64,3072,0.013082666529549493
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,64,2560,0.013088888592190213
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,64,1536,0.004538666870858935
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,64,2048,0.012056888805495368
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,64,16384,0.020823111136754353
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,64,1024,0.003510222252872255
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,64,1536,0.012415111064910889
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,64,768,0.0031679999083280563
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,64,512,0.0031582222630580268
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,64,1024,0.011214222345087262
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,64,768,0.01185955521133211
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,64,256,0.0028400001012616684
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,64,512,0.01073688848151101
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,64,128,0.0026791110220882627
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,64,256,0.012110222544935016
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,64,64,0.002833777831660377
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,64,128,0.010727110836240979
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,64,32,0.0026506665680143568
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,64,64,0.011727111207114326
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,32,65536,0.01144266708029641
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,64,32,0.010021333065297868
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,64,2560,0.006238222122192383
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,32,51200,0.010626667075686984
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,32,16384,0.0069271110826068455
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,32,65536,0.05026488833957248
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,64,2048,0.0052639999323421055
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,32,12288,0.007313778003056844
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,32,10240,0.006704000135262807
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,32,51200,0.041073779265085854
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,64,12288,0.006623111251327727
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,32,8192,0.006747555401590135
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,32,16384,0.020629333125220407
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,32,7168,0.006299555715587404
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,32,12288,0.018553778529167175
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,32,6144,0.006251555350091722
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,32,10240,0.017602667212486267
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,32,8192,0.016136889656384785
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,32,4096,0.005256888767083486
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,32,6144,0.014462222655614218
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,32,3584,0.005555555638339784
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,32,5120,0.014479999740918478
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,32,3072,0.005594666633341048
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,32,4096,0.013471999930010902
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,32,2560,0.005924444645643234
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,32,2048,0.005600000007285013
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,32,3584,0.013088888592190213
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,32,3072,0.013111111190583972
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,32,1536,0.004536889079544279
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,32,2560,0.012449777788586087
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,32,1024,0.0038497779104444715
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,32,768,0.0032142222755485107
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,32,2048,0.013105777402718862
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,32,512,0.0032106666929192017
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,32,1536,0.012372444073359171
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,32,256,0.00281866660548581
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,32,1024,0.011019555230935415
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,32,768,0.011367110742463006
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,32,512,0.011779555843936073
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,32,64,0.002671111168132888
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,32,256,0.011408888631396823
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,32,32,0.0025235555238193935
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,32,128,0.010042666561073726
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,32,64,0.01143022212717268
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,32,32,0.011011555790901184
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,32,5120,0.005959110955397288
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,10,32,7168,0.01553244392077128
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,65536,16384,0.32104089525010854
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,65536,51200,0.49603912565443253
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,65536,16384,0.17158310943179658
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,65536,12288,0.24524267514546713
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,65536,12288,0.1960000064637926
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,65536,10240,0.18782667318979898
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,65536,51200,0.9618924458821615
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,65536,8192,0.15456977155473497
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,65536,10240,0.12799999448988172
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,10,32,128,0.002806222273243798
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,65536,5120,0.09660800298055013
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,65536,6144,0.1146799988216824
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,65536,6144,0.10841688844892715
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,65536,7168,0.1331919961505466
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,65536,4096,0.08060089084837171
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,65536,7168,0.1072124441464742
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,65536,5120,0.07904889186223348
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,65536,3584,0.06894310977723864
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,65536,3072,0.05997688902748955
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,65536,4096,0.07205866442786323
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,65536,2560,0.050400889582104154
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,65536,2048,0.04122577773200141
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,65536,3584,0.06397866540484957
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,65536,1536,0.03244977858331468
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,65536,2560,0.04839644498295254
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,65536,1024,0.023189332750108507
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,65536,768,0.018907555275493197
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,65536,1536,0.0347688893477122
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,65536,512,0.01351199961370892
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,65536,1024,0.02693155573474036
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,65536,256,0.008336889247099558
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,65536,128,0.00657066661450598
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,65536,512,0.018908444378111098
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,65536,64,0.005897777775923411
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,65536,768,0.02426044477356805
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,65536,256,0.015150222513410779
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,65536,32,0.005613333235184352
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,65536,64,0.013813333378897773
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,65536,32,0.015519110692871941
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,65536,8192,0.11563289165496826
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,65536,3072,0.05738400088416206
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,51200,51200,0.3999848895602756
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,51200,65536,0.5234444406297472
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,65536,2048,0.043785777356889516
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,51200,51200,0.8484249114990234
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,51200,12288,0.21188444561428496
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,51200,16384,0.27837954627143013
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,51200,65536,1.0851590898301866
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,65536,128,0.013771555489963956
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,51200,10240,0.17424710591634116
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,51200,8192,0.1413386662801107
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,51200,10240,0.10513689120610555
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,51200,7168,0.12401689423455133
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,51200,12288,0.12395111719767253
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,51200,6144,0.10595289203855728
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,51200,5120,0.08893511030409072
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,51200,4096,0.07247466511196561
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,51200,6144,0.07498755719926622
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,51200,7168,0.08444355593787299
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,51200,5120,0.066012442111969
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,51200,3584,0.06446311208936903
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,51200,4096,0.056073778205447726
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,51200,3072,0.05566222137875027
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,51200,2560,0.04692711101637947
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,51200,3584,0.054218666421042554
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,51200,2048,0.03932977716128031
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,51200,3072,0.04796977837880453
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,51200,1536,0.029883556895785864
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,51200,2560,0.043043557140562266
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,51200,1024,0.02147644427087572
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,51200,2048,0.03668977816899618
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,51200,768,0.01595288846227858
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,51200,1536,0.03019733230272929
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,51200,512,0.011534222298198275
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,51200,1024,0.022944889134830896
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,51200,768,0.02158044444190131
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,51200,128,0.00453599997692638
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,51200,512,0.017990221579869587
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,51200,64,0.0035182221068276297
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,51200,256,0.014126222994592456
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,51200,8192,0.09543466567993164
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,51200,32,0.0035386664999855887
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,51200,128,0.013202666408485837
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,51200,64,0.013782222237851886
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,51200,32,0.014548444085650973
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,16384,65536,0.31796712345547146
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,16384,51200,0.250619543923272
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,16384,65536,0.18219378259446886
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,16384,51200,0.1408568885591295
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,16384,16384,0.09029689100053574
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,16384,12288,0.07045866383446588
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,16384,16384,0.056440002388424344
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,16384,10240,0.05439022183418274
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,16384,8192,0.04432355695300632
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,16384,12288,0.06164444155163235
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,16384,10240,0.048476444350348584
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,16384,6144,0.03318666749530368
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,16384,8192,0.041667554113599986
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,16384,7168,0.04054666558901469
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,16384,5120,0.029040889607535467
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,51200,256,0.0074755557709270054
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,16384,4096,0.024726221958796184
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,16384,6144,0.040022220876481794
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,16384,3584,0.02125955621401469
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,16384,3072,0.018509333332379658
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,16384,5120,0.03207022282812331
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,16384,4096,0.026763555076387193
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,16384,2560,0.015903110305468243
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,16384,3584,0.02610933283964793
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,16384,2048,0.01332444449265798
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,16384,1536,0.010678222609890832
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,16384,3072,0.023659555448426142
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,16384,1024,0.008429333567619324
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,16384,2560,0.022683555881182354
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,16384,768,0.0069057775868309875
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,16384,512,0.004875555634498596
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,16384,1536,0.018343110879262287
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,16384,2048,0.02029511166943444
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,16384,1024,0.015623999966515435
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,16384,128,0.0032293332947625052
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,16384,768,0.014558222558763293
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,16384,64,0.0028417776856157514
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,16384,512,0.012800888882742988
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,16384,32,0.0028275555620590844
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,16384,256,0.012732444538010491
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,16384,128,0.011016888750924004
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,16384,64,0.012039999994966718
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,16384,32,0.011711999773979187
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,12288,65536,0.2525262302822537
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,12288,65536,0.15725421905517578
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,51200,16384,0.13858844174279109
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,16384,7168,0.03807377815246582
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,12288,16384,0.06671200195948283
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,12288,12288,0.05196977655092875
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,12288,10240,0.04435111085573832
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,12288,16384,0.04970399869812859
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,12288,12288,0.04972889026006063
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,12288,7168,0.03283910950024923
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,12288,8192,0.037124445041020714
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,12288,10240,0.04681422313054403
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,12288,8192,0.04253244400024414
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,12288,6144,0.02875022093454997
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,12288,5120,0.025378665990299646
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,12288,7168,0.03542577889230516
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,12288,5120,0.027975112199783325
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,12288,4096,0.02015022271209293
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,16384,256,0.003556444413132138
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,12288,3584,0.01757600075668759
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,12288,3072,0.015535111228624979
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,12288,6144,0.03195377853181627
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,12288,4096,0.02570844524436527
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,12288,2560,0.013399110900031196
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,12288,3584,0.024663999676704407
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,12288,2048,0.011528000235557556
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,12288,1536,0.009571555587980483
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,12288,3072,0.02258311046494378
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,12288,1024,0.007834666305118138
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,12288,2560,0.021199999584092036
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,12288,2048,0.018917333748605516
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,12288,1536,0.01742488808102078
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,12288,512,0.004902222090297275
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,12288,1024,0.01479200025399526
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,12288,256,0.0038613333470291565
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,12288,768,0.014147554834683737
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,12288,128,0.0031519999934567344
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,12288,51200,0.12203644381629096
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,12288,512,0.012744888663291931
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,12288,64,0.0031155554784668815
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,12288,256,0.012443555725945367
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,12288,32,0.0028213332924577924
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,12288,128,0.011721777419249216
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,12288,64,0.011396444506115384
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,12288,32,0.011556444068749746
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,10240,65536,0.21730932924482557
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,10240,51200,0.17226578129662407
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,10240,65536,0.15227111180623373
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,10240,16384,0.05920800235536364
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,10240,51200,0.11709600024753147
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,10240,12288,0.04627911249796549
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,10240,10240,0.037984887758890785
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,10240,16384,0.04794666502210829
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,10240,8192,0.03216177887386746
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,10240,7168,0.028833776712417603
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,10240,12288,0.045401778486039907
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,10240,10240,0.04127111037572225
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,10240,8192,0.031670222679773964
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,10240,6144,0.025888888372315302
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,10240,5120,0.022683555881182354
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,10240,7168,0.031089779403474595
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,10240,4096,0.01829777823554145
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,12288,768,0.006233777850866318
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,10240,3584,0.015824000040690105
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,10240,3072,0.014468444718254937
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,10240,4096,0.02328088879585266
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,10240,3584,0.02200088898340861
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,10240,2560,0.01240355521440506
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,10240,2048,0.01074044406414032
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,10240,3072,0.020278222031063504
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,10240,1536,0.008991999758614434
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,10240,2560,0.019314666589101154
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,10240,2048,0.017921777235137094
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,10240,1536,0.015743111570676167
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,10240,768,0.005920889063013925
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,10240,1024,0.01386844449573093
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,10240,512,0.004543111142185
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,10240,768,0.013527111046844058
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,10240,256,0.0037164443896876443
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,10240,512,0.013096888860066732
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,10240,128,0.0031946665710873077
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,10240,256,0.011403555671374003
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,10240,64,0.002855111120475663
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,10240,128,0.011725333001878528
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,10240,32,0.0031635556370019913
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,10240,64,0.011069333387745751
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,10240,6144,0.027533332506815594
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,10240,32,0.011618666350841522
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,10240,5120,0.024863999750879075
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,12288,51200,0.19883733325534395
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,8192,51200,0.13075110647413465
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,8192,16384,0.045567999283472695
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,8192,65536,0.09652355644438003
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,8192,51200,0.07883555359310575
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,10240,1024,0.007489778101444244
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,8192,16384,0.03665155503484938
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,8192,12288,0.03741777936617533
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,8192,8192,0.02567200031545427
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,8192,7168,0.021568000316619873
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,8192,10240,0.03094844354523553
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,8192,6144,0.019088000059127808
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,8192,7168,0.025817778375413682
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,8192,8192,0.02683111031850179
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,8192,5120,0.01649688846535153
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,8192,4096,0.014624888698259989
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,8192,6144,0.024864888853496973
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,8192,3584,0.012609778179062737
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,8192,5120,0.021164443757798936
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,8192,3072,0.011588444312413534
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,8192,4096,0.02060622142420875
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,8192,3584,0.018955555227067735
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,8192,3072,0.017831999394628737
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,8192,2048,0.008620444271299574
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,8192,2560,0.017512889371977914
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,8192,1536,0.007296889192528195
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,8192,2048,0.015876443849669564
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,8192,65536,0.17338755395677355
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,8192,1024,0.005869333528810077
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,8192,1536,0.01475822263293796
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,8192,768,0.004219555606444676
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,8192,512,0.0038906666967603895
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,8192,12288,0.03279733326699998
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,8192,1024,0.01276711126168569
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,8192,768,0.01309511148267322
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,8192,10240,0.02784444557295905
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,8192,128,0.0028408887899584244
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,8192,512,0.012438221938080259
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,8192,256,0.003532444437344869
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,8192,64,0.0026746667507621977
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,8192,32,0.002814222127199173
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,8192,256,0.011239999698268043
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,8192,64,0.011770666473441653
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,8192,128,0.01068800025516086
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,8192,32,0.01105955574247572
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,7168,65536,0.1491022242440118
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,7168,16384,0.04161333375506931
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,7168,65536,0.09422577752007379
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,7168,51200,0.11609778139326309
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,7168,12288,0.03306577934159173
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,7168,51200,0.07237422466278076
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,7168,10240,0.028021332290437486
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,7168,16384,0.03372177812788222
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,7168,8192,0.022089777721299067
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,7168,7168,0.02053155501683553
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,7168,12288,0.033597333563698664
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,7168,10240,0.029878222280078467
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,7168,6144,0.01812533371978336
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,8192,2560,0.009963555468453301
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,7168,8192,0.026176888081762526
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,7168,4096,0.01346577786737018
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,7168,7168,0.02490844494766659
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,7168,3584,0.011974222130245633
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,7168,5120,0.020480889413091872
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,7168,3072,0.010936000280910067
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,7168,4096,0.019363555643293593
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,7168,2560,0.009543110926946005
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,7168,3584,0.01864622202184465
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,7168,2048,0.00832177781396442
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,7168,1536,0.007296889192528195
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,7168,3072,0.01759377784199185
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,7168,1024,0.005497777627574072
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,7168,2560,0.01688088807794783
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,7168,768,0.004538666870858935
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,7168,2048,0.01535022258758545
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,7168,1536,0.014459555347760519
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,7168,512,0.003846222327815162
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,7168,256,0.003145777723855443
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,7168,1024,0.012738666600651212
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,7168,128,0.0028444443725877335
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,7168,768,0.013061333033773633
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,7168,512,0.012452444268597497
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,7168,256,0.01074399964676963
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,7168,64,0.00286666676402092
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,7168,32,0.0026506665680143568
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,7168,128,0.01074488874938753
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,7168,64,0.011092444260915121
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,7168,32,0.011339555184046427
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,6144,65536,0.1226560009850396
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,6144,16384,0.03565422362751431
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,6144,51200,0.09644444121254815
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,6144,65536,0.08569333288404678
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,6144,12288,0.028423110644022625
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,6144,51200,0.06618489159478082
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,6144,10240,0.024554666545655992
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,7168,5120,0.01572177807490031
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,6144,12288,0.03176800078815884
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,6144,8192,0.02132622235351139
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,6144,16384,0.031826668315463595
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,6144,7168,0.01891288823551602
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,6144,6144,0.016927111479971144
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,6144,10240,0.0299653344684177
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,6144,5120,0.015236443943447538
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,6144,8192,0.0270471109284295
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,6144,4096,0.011398221883508893
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,6144,7168,0.02342133389578925
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,6144,3584,0.01032977799574534
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,6144,6144,0.021771555145581562
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,6144,3072,0.010312889185216691
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,6144,5120,0.019724445210562814
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,6144,2560,0.009018667042255402
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,6144,4096,0.01907999979125129
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,6144,2048,0.007696000238259633
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,6144,3584,0.018204443984561496
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,6144,1536,0.006864000111818314
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,6144,1024,0.004858666823969947
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,6144,2560,0.01590844492117564
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,6144,2048,0.014816888504558139
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,6144,768,0.004176889028814104
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,6144,1536,0.0141004439857271
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,6144,512,0.003551111039188173
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,6144,1024,0.012726222475369772
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,6144,256,0.0031795555518733132
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,6144,128,0.003157333367400699
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,6144,768,0.01276622215906779
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,6144,512,0.012434666355450949
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,6144,64,0.0028417776856157514
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,6144,256,0.010729778144094678
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,6144,32,0.002826666666401757
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,6144,128,0.011083555718262991
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,6144,64,0.011412444214026133
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,5120,65536,0.10627555847167969
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,6144,32,0.010738666686746808
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,5120,51200,0.08467377556694879
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,5120,65536,0.07748533619774713
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,5120,51200,0.06078133318159315
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,5120,16384,0.03183555603027344
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,5120,12288,0.025975111458036635
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,5120,16384,0.029846221208572388
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,5120,12288,0.031567109955681696
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,5120,10240,0.0255377772781584
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,5120,8192,0.01956888867749108
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,5120,7168,0.017419555120997958
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,6144,3072,0.017493334081437852
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,5120,6144,0.015473778049151102
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,5120,8192,0.025268443756633337
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,5120,5120,0.01388177772363027
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,5120,7168,0.022631999519136217
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,5120,4096,0.011721777419249216
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,5120,6144,0.021035555336210463
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,5120,3584,0.010423111418883005
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,5120,5120,0.01900888813866509
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,5120,3072,0.009679111341635386
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,5120,4096,0.018065777089860704
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,5120,2560,0.008550222549173567
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,5120,3584,0.01756533318095737
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,5120,2048,0.007298666569921706
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,5120,1536,0.005935110979610019
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,5120,3072,0.01644977761639489
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,5120,2560,0.015301333533393012
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,5120,1024,0.004548444516128964
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,5120,768,0.0042071110672420925
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,5120,2048,0.014126222994592456
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,5120,512,0.0037991110649373797
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,5120,1536,0.013515555196338229
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,5120,256,0.003145777723855443
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,5120,768,0.012773333324326409
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,5120,128,0.0028942223224374983
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,5120,512,0.011745777395036487
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,5120,64,0.002528888897763358
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,7168,6144,0.022545778089099463
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,5120,256,0.011700444751315646
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,5120,32,0.002576888849337896
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,5120,10240,0.02186044388347202
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,5120,64,0.011369778050316704
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,4096,65536,0.08578577968809341
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,5120,32,0.01110577748881446
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,4096,51200,0.06729155778884888
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,4096,16384,0.027515555421511333
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,4096,65536,0.07039999961853027
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,4096,12288,0.02197422252760993
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,4096,51200,0.05595022439956665
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,4096,16384,0.025937777426507738
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,4096,8192,0.01648533344268799
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,4096,7168,0.013771555489963956
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,4096,12288,0.026905778381559584
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,4096,10240,0.02428177826934391
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,4096,6144,0.012424888710180918
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,4096,8192,0.025255999631351892
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,4096,5120,0.011122666299343109
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,4096,7168,0.021143111917707656
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,4096,6144,0.01980177727010515
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,4096,5120,0.018544889158672757
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,4096,3584,0.008950221869680617
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,4096,4096,0.016843555702103507
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,4096,3584,0.016480889585283067
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,5120,1024,0.012383999923865
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,4096,3072,0.015276443627145557
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,4096,2048,0.006275555739800136
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,4096,2560,0.01482488877243466
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,4096,1536,0.004879111217127906
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,4096,2048,0.013752889302041797
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,5120,128,0.011380444798204633
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,4096,1024,0.0038684445122877755
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,4096,768,0.0038524443904558816
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,4096,1536,0.013090666797426013
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,4096,512,0.003506666670242945
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,4096,1024,0.012783110969596438
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,4096,256,0.0031848889258172777
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,4096,768,0.012278222375445895
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,4096,128,0.0028000000036425064
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,4096,10240,0.018978666928079393
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,4096,512,0.011778666741318174
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,4096,64,0.0028168888141711554
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,4096,256,0.011784888803958893
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,4096,32,0.00254488881263468
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,4096,128,0.010728889041476779
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,4096,64,0.011029333704047732
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,3584,65536,0.07760355869928996
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,4096,32,0.01071466671095954
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,4096,4096,0.010337777435779572
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,3584,51200,0.06013422542148166
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,3584,16384,0.023919110496838886
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,3584,12288,0.018981332580248516
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,3584,65536,0.06766133175955878
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,3584,10240,0.016576889488432143
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,4096,3072,0.007958222594526079
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,3584,16384,0.0251920007997089
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,3584,51200,0.054359111520979136
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,3584,8192,0.014833778142929077
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,3584,12288,0.026542221506436665
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,3584,7168,0.013753777576817406
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,3584,10240,0.023061333431137934
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,3584,6144,0.01180622229973475
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,3584,5120,0.01051644484202067
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,4096,2560,0.006984000404675801
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,3584,8192,0.021831111775504217
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,3584,4096,0.00976533359951443
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,3584,7168,0.020222221811612446
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,3584,3584,0.008551110823949179
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,3584,6144,0.0189057770702574
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,3584,3072,0.007631999750932057
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,3584,5120,0.018205333087179396
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,3584,2560,0.006945778098371293
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,3584,2048,0.0057555557125144536
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,3584,4096,0.016194666425387066
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,3584,1536,0.004551110996140374
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,3584,3584,0.015484443969196744
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,3584,3072,0.014487110906177096
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,3584,1024,0.0038542221817705366
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,3584,2560,0.013971555564138623
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,3584,768,0.0038417776425679526
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,3584,2048,0.013471999930010902
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,3584,512,0.0032017777363459268
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,3584,256,0.0031644445326593188
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,3584,1536,0.013542222479979197
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,3584,1024,0.01202311118443807
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,3584,128,0.002834666727317704
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,3584,768,0.012108444339699216
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,3584,64,0.002475555572244856
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,3584,32,0.0028293333533737394
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,3584,256,0.011023110813564725
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,3584,128,0.011401777466138205
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,3072,65536,0.06377244657940336
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,3584,64,0.011707555916574268
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,3584,32,0.010018666585286459
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,3072,51200,0.050498667690489024
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,3072,12288,0.017522666189405654
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,3072,65536,0.06443022357092963
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,3072,51200,0.052705778015984424
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,3072,10240,0.01676977839734819
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,3072,8192,0.015104888214005364
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,3072,12288,0.02401688860522376
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,3072,7168,0.012619555824332766
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,3072,10240,0.02232355541653103
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,3072,6144,0.011289777855078379
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,3072,8192,0.020853334003024634
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,3072,5120,0.010048888623714447
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,3072,7168,0.019241778386963736
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,3072,4096,0.009322666459613377
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,3072,6144,0.018201778332392376
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,3072,3584,0.008289777570300633
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,3072,5120,0.016579555140601266
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,3072,3072,0.007599111232492659
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,3072,4096,0.01514755520555708
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,3072,2560,0.0063457778758472866
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,3072,3584,0.015133332875039844
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,3072,2048,0.005277333160241445
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,3072,3072,0.014436443646748861
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,3072,1536,0.004562666846646203
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,3072,2560,0.014129777749379476
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,3072,1024,0.003866666720973121
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,3072,2048,0.013371555341614617
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,3584,512,0.011373333632946014
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,3072,768,0.003576888806290097
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,3072,1536,0.012831110921170978
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,3072,512,0.0031848889258172777
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,3072,256,0.0031804444475306403
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,3072,1024,0.012420444852775998
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,3072,16384,0.02026844521363576
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,3072,512,0.011380444798204633
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,3072,64,0.0026417778184016547
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,3072,256,0.010689777632554373
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,3072,16384,0.024559110403060913
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,3072,32,0.0027537778433826235
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,3072,128,0.011061333119869232
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,2560,65536,0.05732444259855482
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,3072,64,0.010748444332016839
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,2560,51200,0.044974221123589404
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,2560,16384,0.019142222073343065
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,2560,65536,0.06284266710281372
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,2560,51200,0.05084977878464592
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,2560,12288,0.01612444387541877
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,2560,10240,0.014358222484588623
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,2560,16384,0.023940443992614746
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,2560,8192,0.012720888687504662
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,2560,12288,0.023235556152131822
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,2560,7168,0.012048888537618848
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,2560,10240,0.021871111459202234
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,2560,8192,0.020637333393096924
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,2560,6144,0.010713777608341642
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,2560,5120,0.010098666780524785
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,2560,7168,0.01854311095343696
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,2560,4096,0.008991999758614434
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,2560,6144,0.01717066599263085
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,2560,3584,0.007806222471925948
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,2560,5120,0.015501333607567681
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,2560,4096,0.014477334088749357
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,2560,3072,0.007258666886223688
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,3072,768,0.012116444607575735
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,2560,3584,0.014480888843536377
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,2560,2560,0.006280888699822956
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,2560,2048,0.005199999858935674
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,2560,3072,0.013773333695199756
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,2560,1536,0.004560889055331548
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,2560,2560,0.013759999639458127
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,2560,2048,0.012857777376969656
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,2560,1024,0.003839111162556542
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,2560,768,0.0037644443412621817
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,3072,32,0.01000088867213991
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,2560,1536,0.012721777790122561
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,2560,512,0.003185777821474605
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,2560,256,0.0031306667046414483
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,2560,1024,0.011776888536082374
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,2560,128,0.0028364445186323593
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,2560,768,0.012083555261294046
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,2560,512,0.011402666568756104
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,2560,64,0.002542222125662698
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,2560,256,0.011005333728260465
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,2560,128,0.010684444672531553
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,2560,64,0.010675555302037133
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,2048,65536,0.05072711242569817
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,2048,51200,0.036679999695883855
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,2048,65536,0.06023910972807142
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,2048,16384,0.016574222180578444
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,2048,51200,0.04974666568968031
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,2048,12288,0.014722666806644864
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,2048,16384,0.023652444283167522
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,3072,128,0.002854222224818336
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,2048,10240,0.013579555683665805
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,2048,8192,0.012612444659074148
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,2048,12288,0.02205955485502879
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,2048,7168,0.0111191107167138
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,2048,10240,0.020209777686331008
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,2048,8192,0.018945778409639995
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,2048,6144,0.0105253333846728
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,2048,5120,0.009349333743254343
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,2048,7168,0.01734133395883772
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,2048,4096,0.008095111283991072
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,2048,6144,0.01555999947918786
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,2048,5120,0.01513155632548862
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,2048,4096,0.014096889230940076
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,2560,32,0.0028044444819291434
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,2048,3072,0.006632888896597757
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,2048,2560,0.00555644432703654
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,2560,32,0.010016889207892949
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,2048,3072,0.013311111264758639
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,2048,2048,0.004964444372389051
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,2048,2560,0.013426666458447775
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,2048,1536,0.004512888689835866
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,2048,1024,0.0038853333228164246
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,2048,2048,0.012772444221708508
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,2048,768,0.0036657779581016968
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,2048,1536,0.012426666915416718
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,2048,1024,0.011720889144473605
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,2048,768,0.012071111136012606
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,2048,256,0.003162666741344664
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,2048,512,0.011407111254003314
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,2048,128,0.00258577780591117
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,2048,256,0.011411555939250521
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,2048,64,0.002809777855873108
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,2048,128,0.010485333700974783
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,2048,32,0.002473777780930201
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,2048,64,0.011579555769761404
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,2048,3584,0.007547555698288812
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,2048,32,0.009699555734793345
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,1536,65536,0.036193778117497764
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,1536,51200,0.02896889050801595
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,1536,16384,0.014132445057233175
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,2048,3584,0.014176888598336114
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,1536,65536,0.05830488602320353
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,1536,12288,0.012746666868527731
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,1536,51200,0.04786666565471225
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,1536,10240,0.011381333072980246
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,1536,16384,0.023074666659037273
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,1536,8192,0.010431999961535135
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,1536,7168,0.009666666388511658
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,1536,12288,0.02119111186928219
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,1536,10240,0.019310222731696237
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,1536,6144,0.009727111293209923
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,1536,8192,0.016192888220151264
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,1536,5120,0.008644444247086843
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,1536,4096,0.007609777980380588
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,1536,7168,0.016186666157510545
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,2048,512,0.003522666792074839
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,1536,6144,0.01536355581548479
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,1536,3072,0.006256888724035687
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,1536,2560,0.00554577757914861
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,1536,5120,0.014741332994567024
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,1536,4096,0.013850666582584381
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,1536,2048,0.004918222212129169
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,1536,3584,0.014126222994592456
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,1536,1536,0.004565333326657613
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,1536,1024,0.003903111235962974
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,1536,3072,0.013461333182122974
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,1536,2560,0.01311466677321328
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,1536,2048,0.012396444049146442
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,1536,1536,0.01274311128589842
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,1536,512,0.0032053333189752367
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,1536,1024,0.01239911135700014
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,1536,256,0.003177777760558658
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,1536,768,0.012058667010731168
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,1536,128,0.0028213332924577924
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,1536,512,0.012084444363911947
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,1536,64,0.0024951110697454875
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,1536,256,0.011709333293967776
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,1536,32,0.0028364445186323593
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,1536,128,0.010739555789364709
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,1024,65536,0.02597155504756504
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,1536,64,0.011388444238238864
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,1024,51200,0.021391999390390184
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,1024,65536,0.0555057790544298
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,1024,16384,0.012048000262843238
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,1024,51200,0.04534133275349935
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,1024,12288,0.011735111474990845
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,1536,3584,0.0068986668354935115
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,1024,16384,0.021960000197092693
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,1024,10240,0.010335110955768162
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,1024,8192,0.008821333448092142
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,1024,12288,0.019925332731670804
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,1024,7168,0.010048000348938836
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,1024,10240,0.018231999542978074
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,1024,6144,0.008791999684439765
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,1024,8192,0.016134222348531086
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,1536,768,0.0034933334423436057
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,1024,5120,0.007641777396202087
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,1024,4096,0.00757422215408749
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,1024,6144,0.015171556009186639
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,1024,3584,0.006911110960774952
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,1024,4096,0.013739555246300168
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,1024,3072,0.006291555447710886
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,1024,3584,0.013872000078360239
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,1024,2560,0.005600888695981767
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,1024,3072,0.013220444321632385
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,1024,2048,0.006590222318967183
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,1024,1536,0.005609777652555042
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,1536,32,0.010372444159454769
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,1024,2560,0.012795555922720166
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,1024,1024,0.00453333349691497
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,1024,2048,0.012427555190192329
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,1024,768,0.0041999999019834726
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,1024,512,0.0035048888789282907
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,1024,1536,0.012112889024946423
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,1024,1024,0.011676444775528379
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,1024,768,0.012033777932325998
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,1024,512,0.012100444071822695
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,1024,256,0.011018666956159802
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,1024,64,0.0028604444944196274
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,1024,128,0.011049778097205691
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,1024,32,0.0028275555620590844
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,1024,64,0.010727110836240979
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,768,65536,0.023183110687467787
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,1024,7168,0.016174222032229107
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,1024,32,0.01035199976629681
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,768,51200,0.019137778215938143
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,768,16384,0.011275555524561139
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,1024,5120,0.0147706667582194
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,768,65536,0.0545457767115699
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,768,12288,0.01089244418674045
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,768,51200,0.04482044445143806
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,768,10240,0.00999644481473499
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,768,16384,0.021338666478792827
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,768,8192,0.00831911133395301
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,768,7168,0.009131555755933126
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,768,12288,0.018762666318151686
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,768,10240,0.017878222796652053
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,768,6144,0.00850399997499254
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,768,5120,0.00793688909875022
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,768,8192,0.016509332590632968
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,768,4096,0.007293333609898885
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,768,7168,0.015799111790127225
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,768,3584,0.0069644442862934535
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,768,6144,0.015478221906556023
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,768,5120,0.014501333236694336
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,768,3072,0.006244444598754247
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,768,2560,0.005548444473081165
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,768,4096,0.01402311192618476
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,1024,256,0.0032151111712058387
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,768,2048,0.005250666704442766
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,768,3584,0.013807999591032663
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,768,1536,0.0052488889131281115
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,768,3072,0.013070222404268054
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,1024,128,0.0028124445428450904
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,768,2560,0.01313333296113544
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,768,768,0.003826666623353958
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,768,2048,0.012064889073371887
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,768,512,0.003474666840500302
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,768,1536,0.01238933371173011
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,768,256,0.0031439999325407874
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,768,1024,0.011706666813956367
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,768,768,0.012068444656001197
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,768,512,0.011415111521879831
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,768,64,0.0028168888141711554
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,768,256,0.011406222151385413
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,768,32,0.0028328889360030494
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,768,128,0.01069866700304879
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,512,65536,0.017494221528371174
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,768,64,0.010794666906197866
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,768,32,0.011054221954610614
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,512,51200,0.016113777955373127
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,512,16384,0.010100444157918295
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,512,65536,0.05334666702482435
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,512,12288,0.010009778042634329
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,512,51200,0.044008000029457935
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,512,10240,0.009354666703277165
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,512,12288,0.018920888503392536
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,512,8192,0.00816000004609426
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,512,10240,0.017539555827776592
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,512,7168,0.009011555876996782
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,512,8192,0.01648355523745219
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,512,6144,0.008280889027648503
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,512,7168,0.015863110621770222
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,512,5120,0.007654222349325816
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,768,1024,0.004219555606444676
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,512,4096,0.007286222444640265
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,512,6144,0.015488889482286243
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,512,3584,0.00693866651919153
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,512,5120,0.014766222900814481
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,768,128,0.0028435554769304064
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,512,3072,0.006613333192136552
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,512,4096,0.013792888985739814
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,512,2560,0.005944889038801193
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,512,3584,0.01383733335468504
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,512,2048,0.005961777849329843
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,512,1536,0.004603555632962121
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,512,3072,0.013117333253224691
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,512,2560,0.01313777764638265
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,512,1024,0.003839111162556542
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,512,768,0.0034808889031410217
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,512,2048,0.012784889174832238
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,512,1536,0.01237422227859497
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,512,1024,0.012078222301271228
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,512,768,0.011756444142924415
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,512,512,0.011930666863918304
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,512,16384,0.02094488839308421
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,512,64,0.002537777854336633
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,512,256,0.010668444136778513
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,512,32,0.002510222295920054
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,512,128,0.011057777537239922
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,512,64,0.010688888529936472
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,256,65536,0.017332444588343304
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,256,51200,0.014649778604507446
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,512,32,0.009370666411187913
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,256,16384,0.009017777939637503
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,256,65536,0.05234044459131029
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,256,51200,0.04110399881998698
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,256,12288,0.008258666429254744
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,256,16384,0.020849777592553034
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,256,10240,0.007308444215191736
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,256,8192,0.0069546666410234236
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,256,12288,0.01828977796766493
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,256,7168,0.006583999842405319
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,256,8192,0.016194666425387066
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,256,6144,0.007279111279381647
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,256,7168,0.015471999843915304
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,256,5120,0.006576889091067844
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,512,512,0.003160888950030009
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,256,6144,0.01519733336236742
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,256,4096,0.006583999842405319
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,256,3584,0.00602311102880372
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,512,256,0.0028311111446883944
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,256,5120,0.014094221923086377
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,256,3072,0.005935110979610019
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,512,128,0.0028560000161329904
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,256,2560,0.006285333385070165
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,256,4096,0.013976888524161445
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,256,2048,0.005984000033802456
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,256,3584,0.013762666947311826
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,256,1536,0.004209777961174647
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,256,3072,0.012729778057999082
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,256,1024,0.003863111138343811
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,256,2560,0.012854222622182635
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,256,768,0.003536000019974179
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,256,2048,0.012728888955381183
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,256,512,0.0032026666320032547
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,256,1536,0.012568888564904531
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,256,256,0.0028648889727062653
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,256,1024,0.011600000162919363
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,256,128,0.0028373334142896864
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,256,768,0.011734222372372946
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,256,64,0.0026933333526055017
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,256,512,0.012039110892348819
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,256,32,0.002522666628162066
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,256,256,0.011715555356608497
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,128,65536,0.01479288935661316
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,256,128,0.010002666877375709
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,128,51200,0.01275288893116845
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,256,64,0.011049778097205691
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,128,16384,0.008319999608728621
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,256,32,0.011076444553004371
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,128,12288,0.007644444704055786
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,128,10240,0.007289778027269576
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,128,65536,0.04938755432764689
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,128,51200,0.04039288891686334
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,128,8192,0.006592000110281839
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,256,10240,0.017350221673647564
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,128,12288,0.018571555614471436
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,128,7168,0.006575999988449945
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,128,6144,0.006239999913507038
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,128,10240,0.017856889300876193
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,128,5120,0.00627377794848548
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,128,8192,0.016036444240146212
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,128,4096,0.005565333283609814
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,128,7168,0.015522667103343539
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,128,6144,0.015114666687117683
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,128,3584,0.005944889038801193
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,128,3072,0.005881777654091517
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,128,4096,0.013418667018413544
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,128,2560,0.005535999933878581
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,128,3072,0.013079110946920184
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,128,2048,0.005567111074924469
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,128,2560,0.01279022213485506
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,128,1536,0.004538666870858935
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,128,2048,0.012646222280131446
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,128,1024,0.003673777812057071
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,128,1536,0.011769777370823754
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,128,768,0.003510222252872255
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,128,1024,0.012039110892348819
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,128,512,0.0031644445326593188
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,128,768,0.011417778001891242
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,128,256,0.002941333378354708
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,128,512,0.012050666742854647
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,128,128,0.0028239999794297745
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,128,256,0.010008888940016428
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,128,64,0.002483555633160803
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,128,128,0.011017777853541903
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,128,32,0.0028008888992998335
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,128,64,0.010660444696744284
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,128,5120,0.014501333236694336
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,64,65536,0.011055111057228513
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,128,32,0.011024889018800525
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,64,51200,0.010508444574144153
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,64,16384,0.006623999940024481
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,64,65536,0.04973599976963467
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,64,12288,0.007297777467303806
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,64,51200,0.04073777794837952
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,64,16384,0.02027466727627648
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,64,10240,0.0069297779765393995
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,64,8192,0.006620444357395172
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,64,12288,0.01889155473974016
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,64,7168,0.006584888945023219
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,64,8192,0.01647555496957567
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,64,6144,0.006227555374304454
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,64,5120,0.005613333235184352
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,64,7168,0.01610933409796821
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,64,4096,0.005280888742870755
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,64,6144,0.01480888823668162
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,64,5120,0.014428445034556918
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,64,3584,0.005611555443869696
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,128,16384,0.020637333393096924
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,64,4096,0.014109333356221518
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,64,2560,0.005937777873542573
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,64,3584,0.013753777576817406
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,64,2048,0.005888000130653381
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,64,3072,0.01276266657643848
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,64,1536,0.0041999999019834726
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,64,2560,0.013417777915795645
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,64,1024,0.00387999994887246
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,64,2048,0.012440000143316058
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,64,768,0.003478222423129611
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,64,1536,0.01204711116022534
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,128,3584,0.013746666411558786
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,64,512,0.0031759999692440033
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,64,1024,0.012098666694429187
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,64,256,0.0025884444928831523
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,64,128,0.0025920000755124623
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,64,768,0.012054222325483957
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,64,64,0.002473777780930201
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,64,512,0.012051555845472546
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,64,256,0.01184177812602785
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,64,32,0.0028133332315418455
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,64,128,0.010403555300500657
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,32,65536,0.011373333632946014
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,32,51200,0.010407999985747868
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,64,64,0.011592888997660743
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,64,10240,0.017176000608338248
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,32,16384,0.006637333167923822
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,32,12288,0.006970666348934174
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,32,65536,0.04896266592873467
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,32,10240,0.006249777972698212
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,32,51200,0.04107111030154758
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,32,16384,0.020575111111005146
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,32,8192,0.006646222124497096
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,32,12288,0.018526222970750596
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,32,7168,0.006628444625271692
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,32,6144,0.006224000205596288
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,32,10240,0.01720355616675483
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,32,8192,0.0159244438012441
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,32,5120,0.00526311124364535
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,64,3072,0.005320000151793162
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,32,4096,0.0052666668262746595
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,32,7168,0.015512888630231222
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,32,3584,0.00556355549229516
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,32,6144,0.015140444040298462
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,32,3072,0.005570666657553778
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,32,5120,0.014095111025704278
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,32,4096,0.013762666947311826
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,32,3584,0.013759999639458127
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,32,2048,0.0057848890622456866
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,32,3072,0.013120888835854001
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,32,1536,0.004540444248252445
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,32,2560,0.012726222475369772
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,32,1024,0.0038604442444112566
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,32,2048,0.012434666355450949
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,32,768,0.0035457776652442086
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,32,1536,0.012410666379663678
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,32,512,0.003181333343187968
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,32,1024,0.011359111302428775
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,32,256,0.0028328889360030494
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,32,768,0.01205244412024816
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,32,512,0.0120319997270902
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,64,32,0.01038933296998342
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,32,256,0.010963555839326648
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,32,64,0.0028560000161329904
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,32,32,0.002512000087234709
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,32,64,0.0103511114915212
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,32,32,0.010451555252075195
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,32,2560,0.005714666512277391
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,65536,51200,0.49580886628892684
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,9,32,128,0.002847111059559716
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,65536,51200,1.0224231084187825
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,65536,16384,0.3423475424448649
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,9,32,128,0.011075555450386472
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,65536,16384,0.17075378364986846
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,65536,12288,0.18861156039767793
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,65536,12288,0.24612177742852104
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,65536,10240,0.20613333914015028
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,65536,10240,0.14708356062571207
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,65536,8192,0.15444444285498724
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,65536,8192,0.13541689183976915
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,65536,7168,0.13330045011308458
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,65536,7168,0.10099733538097805
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,65536,10240,0.12782133950127497
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,65536,12288,0.14750577343834773
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,65536,6144,0.11479289001888698
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,65536,6144,0.09071377913157146
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,65536,8192,0.11073866817686294
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,65536,5120,0.09649333026674058
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,65536,16384,0.19008089436425102
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,65536,5120,0.08133777644899157
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,65536,7168,0.09767999913957383
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,65536,4096,0.08020710945129395
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,65536,3584,0.0687662230597602
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,65536,4096,0.06639733579423693
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,65536,3584,0.06543199883566962
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,65536,3072,0.05968266725540161
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,65536,4096,0.06662933031717937
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,65536,5120,0.07842044697867499
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,65536,6144,0.08817333645290798
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,65536,3584,0.06314755810631646
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,65536,2560,0.050422221422195435
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,65536,3072,0.05702400207519531
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,65536,2048,0.04142755601141188
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,65536,2560,0.0456853343380822
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,65536,1536,0.03223199976815118
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,65536,2048,0.03985244366857741
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,65536,2560,0.051811556021372475
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,65536,1536,0.03151199883884854
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,65536,1024,0.02356622285313076
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,65536,1024,0.023615999354256526
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,65536,1536,0.041914665036731295
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,65536,768,0.018830221560266282
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,65536,768,0.022280888424979314
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,65536,1024,0.03794044587347243
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,65536,768,0.032878223392698504
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,65536,512,0.0136808885468377
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,65536,256,0.008163555628723567
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,65536,512,0.029699554045995075
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,65536,512,0.019242667489581637
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,65536,256,0.015631111131774057
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,65536,256,0.025568000144428674
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,65536,64,0.00590133335855272
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,65536,128,0.020761777957280476
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,65536,128,0.01440622243616316
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,65536,32,0.00555288874440723
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,65536,64,0.015454222758611044
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,65536,32,0.015351111690203348
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,65536,3072,0.057272891203562416
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,65536,2048,0.04737777842415703
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,51200,65536,0.523180431789822
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,65536,51200,0.5203564431932237
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,51200,65536,0.9725866317749023
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,51200,51200,0.3995369010501438
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,65536,128,0.006583111153708563
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,51200,51200,0.7502560085720487
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,51200,16384,0.2519964377085368
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,51200,12288,0.19420711199442545
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,51200,10240,0.16291911072201198
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,51200,16384,0.1388604508505927
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,51200,12288,0.1225866609149509
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,51200,10240,0.1363697714275784
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,51200,8192,0.11447200510236953
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,51200,7168,0.12279378043280707
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,51200,7168,0.08284088638093737
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,51200,10240,0.10576355457305908
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,51200,16384,0.1569546726014879
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,51200,12288,0.12086489465501572
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,51200,6144,0.10337155395083958
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,51200,8192,0.09273599916034275
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,51200,6144,0.0787022246254815
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,51200,5120,0.09041066964467366
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,51200,5120,0.06588266955481635
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,51200,8192,0.1388346619076199
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,51200,4096,0.07190755340788099
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,51200,7168,0.08252711428536309
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,51200,4096,0.054901334974500865
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,51200,3584,0.06302933560477363
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,51200,6144,0.07393155495325725
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,51200,5120,0.06703911225001018
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,51200,3072,0.055677334467569985
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,51200,3584,0.04942399925655789
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,51200,2560,0.046852442953321666
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,51200,3072,0.044341332382626004
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,51200,4096,0.059678223397996694
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,51200,3584,0.05596444341871473
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,51200,2048,0.03785599933730231
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,51200,2560,0.03850133220354716
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,51200,3072,0.050845334927241005
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,51200,1536,0.029791110091739233
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,51200,2048,0.033081776565975614
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,51200,2560,0.04749511016739739
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,51200,1024,0.021014221840434607
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,51200,1536,0.02752444479200575
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,51200,2048,0.045087112320793994
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,51200,768,0.015835555063353646
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,51200,1536,0.036983999941084124
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,51200,1024,0.02145511077509986
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,51200,512,0.011501332951916588
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,51200,1024,0.03437155485153198
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,51200,256,0.007245333658324347
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,51200,768,0.020765332712067496
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,51200,512,0.017551110850440133
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,51200,128,0.0038924444880750445
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,51200,256,0.01421688828203413
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,51200,256,0.025193777349260118
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,51200,64,0.0033857776886887024
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,51200,128,0.013497778111033969
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,51200,128,0.02109777761830224
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,51200,32,0.003488000068399641
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,51200,64,0.01458755632241567
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,51200,32,0.013478221992651621
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,16384,65536,0.3242071204715305
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,16384,65536,0.18246489100986055
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,16384,51200,0.2516453266143799
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,51200,51200,0.4135048919253879
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,16384,51200,0.14022844367557102
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,16384,16384,0.08700444300969441
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,51200,768,0.02938577863905165
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,16384,16384,0.056608001391092934
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,16384,12288,0.06772089004516602
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,16384,12288,0.0567457808388604
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,16384,10240,0.05499022205670675
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,16384,12288,0.058339556058247886
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,51200,65536,0.534786648220486
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,16384,16384,0.06986133257548015
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,16384,8192,0.042760888735453285
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,16384,10240,0.049808889627456665
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,16384,7168,0.037654221057891846
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,16384,8192,0.04652355445755852
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,16384,10240,0.05324088864856296
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,16384,7168,0.04049244523048401
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,16384,6144,0.032673776149749756
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,16384,8192,0.05021244287490845
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,16384,5120,0.028004444307751123
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,16384,7168,0.04525244567129347
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,16384,6144,0.03654133280118307
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,16384,65536,0.1949004464679294
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,16384,4096,0.024118221468395654
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,16384,6144,0.043215112553702466
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,16384,5120,0.03236533204714457
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,16384,3584,0.020638222495714825
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,16384,51200,0.16204710801442465
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,16384,4096,0.027060444156328838
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,16384,4096,0.036200887627071805
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,16384,3584,0.03378222386042277
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,16384,3072,0.018365333477656048
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,16384,3072,0.023927110764715407
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,16384,2560,0.015783111254374187
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,16384,5120,0.03944089015324911
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,16384,3584,0.025128000312381323
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,16384,3072,0.03282399972279867
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,16384,2560,0.02127555509408315
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,16384,2560,0.030768000417285498
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,16384,1536,0.011026666396194033
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,16384,2048,0.029861334297392104
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,16384,1024,0.008349333372380998
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,16384,2048,0.01867644488811493
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,16384,768,0.006912888752089606
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,16384,1536,0.026724444495307073
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,16384,1536,0.017072000437312655
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,16384,1024,0.026426666312747534
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,16384,512,0.00489066665371259
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,16384,1024,0.014211555322011312
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,16384,256,0.003272888975010978
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,16384,768,0.013789333403110504
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,16384,512,0.022978666755888198
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,16384,512,0.013432000246312885
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,16384,128,0.0028417776856157514
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,16384,256,0.02129688858985901
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,16384,128,0.011427555647161273
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,16384,128,0.019186667270130582
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,16384,64,0.0028648889727062653
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,51200,512,0.02849777870708042
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,16384,32,0.0028533333291610083
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,16384,64,0.011744000017642975
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,16384,32,0.011193777951929303
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,12288,65536,0.24648443857828775
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,12288,65536,0.15795821613735622
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,16384,2048,0.013447110851605734
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,12288,51200,0.19053867128160265
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,12288,51200,0.12151200241512722
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,12288,16384,0.06686933173073663
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,16384,768,0.023356444305843774
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,12288,16384,0.049399111005995006
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,12288,12288,0.05202133456865946
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,16384,256,0.011376000112957425
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,12288,10240,0.04469866553942362
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,12288,12288,0.04659822252061632
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,12288,16384,0.06090222464667427
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,12288,10240,0.04413777920934889
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,12288,8192,0.03683733277850681
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,12288,10240,0.04657333427005344
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,12288,8192,0.039008888933393694
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,12288,7168,0.032607999112870954
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,12288,51200,0.12306222650739883
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,12288,8192,0.04447111156251696
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,12288,6144,0.028759111960728962
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,12288,65536,0.1535822285546197
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,12288,7168,0.040629333919949
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,12288,5120,0.025086222423447505
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,12288,6144,0.0343537794219123
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,12288,4096,0.021988444858127173
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,12288,6144,0.03839288817511664
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,12288,5120,0.02868710954984029
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,12288,5120,0.03496711121665107
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,12288,3584,0.01959111127588484
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,12288,4096,0.025756445195939805
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,12288,4096,0.03268622358640035
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,12288,3072,0.01759022143152025
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,12288,3584,0.023306666149033442
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,12288,3584,0.03135822216669718
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,12288,3072,0.03092355529467265
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,12288,2560,0.015453333655993143
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,12288,3072,0.022449778185950384
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,12288,2048,0.013329777452680798
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,12288,2560,0.019925332731670804
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,12288,2560,0.029177778297000464
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,12288,1536,0.008886222210195329
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,12288,2048,0.01851466629240248
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,12288,2048,0.028436445527606543
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,12288,12288,0.05073688758744133
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,12288,1024,0.007260444263617198
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,12288,768,0.005717333406209946
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,12288,1536,0.02604266670015123
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,12288,1536,0.017512889371977914
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,12288,1024,0.023077333966890972
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,12288,1024,0.014124444789356656
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,12288,768,0.02125155594613817
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,12288,768,0.013463999662134381
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,12288,256,0.0032026666320032547
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,12288,512,0.022300443715519373
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,12288,512,0.012317332956526013
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,12288,128,0.0028684443483750024
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,12288,7168,0.0362684428691864
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,12288,256,0.020643555455737643
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,12288,256,0.01148622234662374
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,12288,64,0.0028293333533737394
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,12288,32,0.0028764444092909494
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,12288,128,0.02026844521363576
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,12288,128,0.011013333168294696
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,12288,64,0.011384000380833944
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,12288,32,0.011395555403497485
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,10240,65536,0.20703021685282388
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,10240,51200,0.16285955905914307
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,10240,65536,0.14952266216278076
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,10240,51200,0.11653155750698513
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,10240,16384,0.05923910935719808
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,10240,16384,0.047725333107842334
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,10240,12288,0.04428177740838793
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,10240,12288,0.047447111871507436
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,10240,16384,0.05416622095637851
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,10240,10240,0.03812888926929898
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,10240,12288,0.047888888253106006
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,12288,512,0.0038888889054457345
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,10240,8192,0.031581332286198936
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,10240,10240,0.03872088922394647
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,10240,8192,0.033655110332700945
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,10240,7168,0.028696888022952612
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,10240,10240,0.04477777745988634
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,10240,8192,0.04173600011401706
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,10240,6144,0.02574488851759169
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,10240,51200,0.10961600144704182
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,10240,7168,0.03014933400683933
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,10240,5120,0.022387555903858606
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,10240,6144,0.028370665179358587
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,10240,7168,0.03911555475658841
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,10240,6144,0.03619822197490268
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,10240,5120,0.025376889440748427
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,10240,5120,0.033879998657438494
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,10240,3584,0.017500445246696472
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,10240,4096,0.03144266539149814
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,10240,3072,0.015650666422314115
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,10240,3584,0.02090311050415039
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,10240,3584,0.03065955638885498
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,10240,2560,0.01402666668097178
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,10240,3072,0.030159112479951646
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,10240,3072,0.0203813330994712
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,10240,2048,0.01036000003417333
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,10240,2560,0.01854933301607768
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,10240,2560,0.028781334559122723
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,10240,1536,0.009015111459626092
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,10240,2048,0.017082666357358296
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,10240,2048,0.027518222729365032
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,10240,1024,0.006457777900828256
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,10240,1536,0.016024889217482675
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,10240,1536,0.025389333566029865
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,10240,768,0.005552000055710475
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,10240,1024,0.013428444663683573
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,10240,1024,0.02200088898340861
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,10240,512,0.003924444317817688
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,10240,768,0.012770666844315
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,10240,65536,0.13559556007385254
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,10240,256,0.003165333428316646
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,10240,512,0.02075377768940396
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,10240,4096,0.019466666711701285
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,10240,128,0.0028488888508743713
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,10240,256,0.011207111179828644
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,10240,256,0.020613332589467365
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,10240,64,0.0030862221287356485
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,10240,128,0.018730666902330186
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,10240,128,0.011375111010339526
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,10240,32,0.0028391112056043413
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,10240,64,0.011381333072980246
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,10240,32,0.011428444749779172
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,8192,65536,0.17133688926696777
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,8192,65536,0.09940977891286214
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,8192,51200,0.12962399588690862
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,8192,51200,0.07824355363845825
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,8192,16384,0.04552622305022346
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,10240,768,0.02165599995189243
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,8192,16384,0.036277333895365395
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,10240,512,0.012056888805495368
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,8192,12288,0.032815112007988825
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,10240,4096,0.02270222206910451
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,8192,16384,0.053278221024407275
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,8192,12288,0.034527109728919134
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,8192,65536,0.1278266641828749
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,8192,51200,0.10476889212926228
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,8192,10240,0.027515555421511333
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,8192,8192,0.023740443918440077
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,8192,12288,0.04621600111325582
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,8192,10240,0.0321777794096205
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,8192,7168,0.02038666605949402
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,8192,10240,0.04269955555597941
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,8192,8192,0.027783112393485174
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,8192,6144,0.018225777480337355
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,8192,8192,0.04020533296797011
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,8192,5120,0.015785778562227886
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,8192,7168,0.02477866742346022
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,8192,7168,0.03707289033465915
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,8192,4096,0.013763555222087435
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,8192,6144,0.02276533345381419
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,8192,5120,0.021609778205553692
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,8192,5120,0.03426577647527059
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,8192,4096,0.01960088809331258
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,8192,4096,0.03104089034928216
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,8192,3072,0.011003555523024665
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,8192,3584,0.03119644522666931
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,8192,3584,0.01888088881969452
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,8192,2560,0.009300444689061906
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,8192,3072,0.028944889704386394
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,8192,3072,0.01753155555990007
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,8192,2048,0.008279110822412703
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,8192,2560,0.017095110482639737
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,8192,1536,0.0070773329999711775
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,8192,2048,0.027173333697848853
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,8192,2048,0.015271110667122735
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,8192,1024,0.005930666708283954
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,8192,1536,0.01443555619981554
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,8192,1536,0.023181334137916565
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,8192,768,0.0041644444896115195
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,8192,1024,0.012425777812798819
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,8192,1024,0.02309333284695943
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,8192,512,0.0032017777363459268
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,8192,768,0.012402666939629449
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,8192,768,0.021290666527218286
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,8192,256,0.0031351111829280853
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,8192,512,0.021314667330847845
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,8192,256,0.010993777877754636
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,8192,6144,0.035628444618648954
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,8192,256,0.0210524449745814
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,8192,3584,0.01178311142656538
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,8192,64,0.002834666727317704
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,8192,128,0.0188755558596717
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,8192,128,0.010738666686746808
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,8192,32,0.0028444443725877335
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,8192,64,0.011086222198274402
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,8192,32,0.01033688916100396
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,8192,2560,0.029393778906928167
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,7168,65536,0.14850489298502603
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,7168,65536,0.09266933467653062
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,7168,51200,0.1177546713087294
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,7168,51200,0.07188266515731812
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,7168,16384,0.041478223270840116
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,8192,512,0.012409778104888068
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,7168,16384,0.034259554412629865
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,7168,12288,0.03334044416745504
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,8192,128,0.0028168888141711554
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,7168,65536,0.12690667311350504
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,7168,12288,0.033222221665912204
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,7168,16384,0.05316533313857185
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,7168,10240,0.028488887680901423
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,7168,12288,0.04620888829231262
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,7168,8192,0.024280889166726008
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,7168,51200,0.10459555519951715
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,7168,7168,0.018894222047593858
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,7168,10240,0.029459555943806965
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,7168,10240,0.042656888564427696
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,7168,6144,0.016528000434239704
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,7168,8192,0.038995554049809776
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,7168,8192,0.02631644407908122
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,7168,7168,0.02363377809524536
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,7168,5120,0.01443822185198466
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,7168,7168,0.037215110328462385
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,7168,4096,0.012711111042234631
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,7168,6144,0.03501155641343858
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,7168,3584,0.010832000109884473
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,7168,5120,0.02128977742460039
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,7168,5120,0.03275110986497667
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,7168,4096,0.03080000148879157
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,7168,4096,0.01925066610177358
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,7168,3072,0.010144888526863521
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,7168,2560,0.008783111141787635
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,7168,3584,0.030954665607876245
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,7168,3584,0.01789955629242791
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,7168,3072,0.029613332615958318
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,7168,3072,0.01719377769364251
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,7168,2560,0.016521778371598985
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,7168,2560,0.02938666608598497
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,7168,1536,0.006602666858169768
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,7168,2048,0.026480888326962788
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,7168,2048,0.014783999986118741
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,7168,1024,0.004515555583768421
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,7168,1536,0.013818666338920593
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,7168,768,0.0041857775714662345
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,7168,1024,0.021553777986102637
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,7168,1024,0.012379555238617791
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,7168,512,0.0034977777136696708
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,7168,768,0.02126755482620663
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,7168,512,0.011422221859296164
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,7168,256,0.003168888803985384
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,7168,512,0.02090488870938619
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,7168,256,0.020568889048364427
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,7168,256,0.010694222317801582
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,7168,128,0.0028151110228565005
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,7168,6144,0.022967111733224656
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,7168,64,0.0028444443725877335
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,7168,128,0.01032977799574534
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,7168,32,0.00254133323000537
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,7168,64,0.011380444798204633
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,7168,2048,0.007983110845088959
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,7168,32,0.010482666393121084
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,6144,65536,0.1227137777540419
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,6144,65536,0.0861591100692749
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,7168,1536,0.024021334118313257
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,6144,51200,0.06566488742828369
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,7168,768,0.01277599980433782
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,6144,16384,0.03512710995144314
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,6144,16384,0.03148266673088074
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,6144,12288,0.028831998507181805
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,6144,16384,0.05221244361665514
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,6144,51200,0.10532710949579875
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,6144,12288,0.030857778257793848
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,7168,128,0.018586667047606576
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,6144,10240,0.024806222981876794
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,6144,12288,0.045272890064451426
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,6144,8192,0.021372444099850122
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,6144,10240,0.03017066584693061
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,6144,10240,0.04169688953293694
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,6144,8192,0.02569866677125295
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,6144,7168,0.019140443868107267
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,6144,8192,0.0396088891559177
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,6144,6144,0.01684177749686771
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,6144,7168,0.02271733350223965
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,6144,7168,0.036328001154793635
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,6144,6144,0.021737777524524268
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,6144,6144,0.035599999957614474
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,6144,4096,0.01203555530971951
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,6144,5120,0.033032887511783175
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,6144,5120,0.01978488928741879
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,6144,3584,0.010261333651012844
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,6144,4096,0.031594667169782854
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,6144,4096,0.018560000591807894
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,6144,3072,0.008983111215962304
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,6144,3584,0.017364444004164804
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,6144,3584,0.029891557163662378
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,6144,2560,0.008293333152929941
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,6144,3072,0.029608001311620075
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,6144,3072,0.016737777325842116
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,6144,2048,0.007281777759393056
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,6144,65536,0.1255626678466797
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,6144,2048,0.014115555418862237
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,6144,1536,0.0063884444534778595
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,6144,2048,0.02648888859483931
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,6144,1536,0.0240000006225374
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,6144,1536,0.013408000270525614
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,6144,1024,0.004243555582231945
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,6144,1024,0.02162133322821723
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,6144,1024,0.012713777522246042
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,6144,768,0.0038355555799272326
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,6144,5120,0.015256888336605497
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,6144,512,0.0034959999223550162
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,6144,768,0.021984888447655573
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,6144,768,0.012441777520709567
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,6144,256,0.0032115555885765287
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,6144,512,0.020642666353119742
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,6144,512,0.011573333707120685
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,6144,128,0.0028737777223189673
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,6144,256,0.011373333632946014
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,6144,256,0.020591111646758187
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,6144,64,0.00281866660548581
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,6144,128,0.020350222786267597
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,6144,128,0.010674667027261523
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,6144,32,0.0025155554629034465
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,6144,2560,0.015460444821251763
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,6144,64,0.011019555230935415
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,6144,32,0.010039110978444418
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,5120,65536,0.10629066493776108
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,5120,51200,0.08495377831988865
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,5120,65536,0.07584533426496717
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,5120,16384,0.0321324434545305
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,5120,51200,0.06050755580266317
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,5120,16384,0.029523554775449965
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,5120,12288,0.02591288917594486
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,5120,16384,0.05180977781613668
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,6144,51200,0.0964168906211853
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,5120,12288,0.02944177720281813
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,5120,10240,0.02204977803760105
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,5120,51200,0.10445333189434475
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,5120,12288,0.04527733392185635
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,5120,8192,0.019654222660594516
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,5120,10240,0.027064889669418335
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,5120,8192,0.023982221881548565
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,5120,7168,0.017265778448846605
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,5120,8192,0.03839377893341912
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,5120,10240,0.041526221566730075
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,5120,6144,0.015544000599119397
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,5120,7168,0.022280888424979314
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,6144,2560,0.028853333658642236
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,5120,5120,0.01383733335468504
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,5120,6144,0.034527109728919134
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,5120,6144,0.021543110410372417
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,5120,4096,0.010810666614108615
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,5120,5120,0.03353155652681986
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,5120,4096,0.018353778454992507
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,5120,3584,0.009299555586444007
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,5120,3584,0.030397332376903955
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,5120,3584,0.01721600029203627
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,5120,3072,0.008433777425024245
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,5120,3072,0.01625333395269182
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,5120,2560,0.007947555846638149
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,5120,65536,0.12549777825673422
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,5120,2560,0.014847111370828418
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,5120,2560,0.027294221851560805
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,5120,2048,0.006853333363930385
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,5120,1536,0.005432888865470886
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,5120,2048,0.025013332565625507
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,5120,2048,0.01369866645998425
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,5120,1024,0.0041831110914548235
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,5120,1536,0.012560000022252401
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,5120,7168,0.035981333918041654
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,5120,1536,0.023359111613697473
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,5120,768,0.0038613333470291565
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,5120,1024,0.012068444656001197
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,5120,1024,0.022421333524915908
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,5120,512,0.0034924443397257063
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,5120,768,0.012450666891203986
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,5120,256,0.0028782222006056043
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,5120,5120,0.019557333654827543
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,5120,4096,0.03042844600147671
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,5120,512,0.020920889245139226
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,5120,128,0.0028133332315418455
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,5120,256,0.022299556268586054
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,5120,64,0.0028239999794297745
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,5120,128,0.010327999790509542
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,5120,32,0.002520888836847411
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,5120,64,0.011730666789743634
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,5120,32,0.010344888601038191
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,4096,65536,0.09270222319497003
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,4096,65536,0.07089244657092623
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,4096,51200,0.06708533234066434
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,4096,51200,0.05573599868350559
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,4096,65536,0.12607822153303358
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,5120,768,0.02128177715672387
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,4096,16384,0.02648888859483931
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,4096,12288,0.02070844504568312
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,5120,512,0.011035555766688453
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,4096,16384,0.02719288898838891
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,5120,256,0.011385777758227454
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,4096,16384,0.04999022351370918
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,4096,10240,0.01844888925552368
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,5120,128,0.018583999739752877
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,4096,12288,0.026957333087921143
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,4096,8192,0.016064888901180692
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,4096,51200,0.10393777820799087
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,4096,12288,0.044080889887279935
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,4096,7168,0.014392889208263822
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,5120,3072,0.030361778206295435
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,4096,10240,0.04151644309361776
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,4096,8192,0.02292266653643714
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,4096,6144,0.013408888545301227
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,4096,5120,0.01197866681549284
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,4096,7168,0.020901333954599168
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,4096,7168,0.03599111239115397
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,4096,6144,0.020587555236286588
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,4096,4096,0.010776888993051318
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,4096,6144,0.03388977713055081
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,4096,3584,0.011378666592968835
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,4096,5120,0.032623112201690674
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,4096,5120,0.0185253338681327
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,4096,4096,0.030829333596759375
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,4096,4096,0.01752355529202355
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,4096,3584,0.02949955397182041
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,4096,3584,0.01711466742886437
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,4096,2560,0.009315555294354757
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,4096,3072,0.015119110544522604
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,4096,3072,0.02699111070897844
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,4096,2048,0.008254222571849823
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,4096,2560,0.013935999737845527
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,4096,2560,0.026328888204362657
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,4096,1536,0.005947555518812603
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,4096,2048,0.013772444592581855
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,4096,2048,0.02398577829202016
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,4096,1024,0.004874666531880696
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,4096,1536,0.02331999937693278
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,4096,768,0.004518222063779831
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,4096,1024,0.022964444425370958
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,4096,1024,0.01202933324707879
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,4096,512,0.0038542221817705366
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,4096,768,0.012090666426552666
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,4096,768,0.022451554735501606
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,4096,256,0.0029768887907266617
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,4096,512,0.01148444414138794
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,4096,512,0.021327111456129286
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,4096,128,0.0028204443968004654
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,4096,8192,0.03835555579927232
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,4096,256,0.011348444554540845
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,4096,256,0.020304888486862183
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,4096,64,0.0028373334142896864
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,4096,32,0.002830222249031067
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,4096,128,0.018582221534517076
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,4096,128,0.010524444282054901
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,4096,64,0.010850666297806634
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,3584,65536,0.07957333326339722
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,4096,3072,0.010276444256305695
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,3584,65536,0.06707644462585449
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,3584,51200,0.05432800120777554
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,3584,16384,0.024319110645188227
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,3584,65536,0.12496977382236057
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,4096,1536,0.012464889221721225
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,3584,16384,0.02529688841766781
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,3584,12288,0.019428445233239066
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,3584,16384,0.05002489023738437
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,3584,12288,0.043952001465691455
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,3584,10240,0.016826666063732572
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,3584,12288,0.025409777959187824
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,3584,8192,0.014498665928840637
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,4096,10240,0.02569155560599433
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,3584,10240,0.04094488753212823
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,3584,7168,0.013242666920026144
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,3584,8192,0.021425777011447485
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,3584,8192,0.03798844416936239
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,3584,6144,0.012096888489193387
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,3584,7168,0.02075822154680888
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,3584,7168,0.03686844309171041
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,3584,5120,0.011124444504578909
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,3584,6144,0.019496000475353666
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,3584,51200,0.06189066833919949
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,3584,6144,0.033893333541022405
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,3584,4096,0.010265777508417765
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,3584,5120,0.01816177699300978
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,3584,5120,0.032582223415374756
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,3584,3584,0.010817777779367236
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,3584,4096,0.01685422162214915
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,3584,4096,0.029839111698998347
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,3584,3072,0.009621333744790819
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,3584,3584,0.016031111280123394
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,3584,3584,0.02832711074087355
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,3584,2560,0.00830844458606508
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,3584,3072,0.026719111535284255
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,3584,3072,0.01442577772670322
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,3584,2048,0.007080888582600488
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,3584,51200,0.10418666733635797
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,3584,1536,0.005564444594913059
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,3584,2560,0.025363556212849084
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,3584,2048,0.023984889189402264
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,3584,1536,0.022985777921146814
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,3584,1536,0.01238044434123569
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,3584,1024,0.004916444420814514
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,3584,10240,0.023637332850032385
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,3584,1024,0.01204177737236023
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,3584,768,0.00424177779091729
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,3584,768,0.021288888321982488
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,3584,768,0.012070222033394707
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,3584,512,0.0035546666218174826
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,4096,32,0.010355555348926121
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,3584,512,0.02096533278624217
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,3584,512,0.011066666907734342
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,3584,256,0.010689777632554373
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,3584,128,0.0028026666906144884
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,3584,128,0.010688888529936472
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,3584,2560,0.013796444568369122
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,3584,64,0.002584888910253843
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,3584,2048,0.012880889077981314
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,3584,32,0.0028080000645584534
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,3584,64,0.011694221860832639
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,3584,32,0.010016000105275048
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,3584,1024,0.02234488891230689
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,3072,65536,0.06342666678958468
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,3072,51200,0.05071466830041674
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,3072,65536,0.06429421901702881
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,3584,256,0.003175111073586676
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,3072,51200,0.05237955517239041
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,3072,16384,0.020672000116772123
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,3072,65536,0.12501333819495306
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,3584,256,0.02125066684352027
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,3072,16384,0.024724443753560383
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,3072,12288,0.01737777723206414
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,3072,51200,0.10384711292054917
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,3072,10240,0.015099555253982544
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,3072,16384,0.05136977632840475
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,3072,8192,0.01311288856797748
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,3072,12288,0.025062221619817946
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,3072,12288,0.04446488949987623
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,3072,10240,0.041005333264668785
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,3072,10240,0.022966222630606756
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,3072,7168,0.012379555238617791
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,3072,8192,0.020408888657887776
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,3072,6144,0.011355555719799466
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,3072,8192,0.03780711028310988
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,3584,128,0.01865244408448537
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,3072,7168,0.035402665535608925
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,3072,6144,0.03476000163290236
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,3072,6144,0.018381334013409086
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,3072,4096,0.009644444617960189
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,3072,5120,0.017501332693629794
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,3072,5120,0.032440887557135686
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,3072,3584,0.009298666483826106
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,3072,4096,0.029492444462246362
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,3072,4096,0.01516711049609714
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,3072,3072,0.008709333009190029
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,3072,3584,0.014448000325096978
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,3072,3584,0.0273973329199685
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,3072,2560,0.007939555578761632
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,3072,3072,0.02682311170630985
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,3072,3072,0.014115555418862237
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,3072,2560,0.025036444266637165
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,3072,2560,0.013707555830478668
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,3072,1536,0.006240889016124938
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,3072,2048,0.0236453331179089
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,3072,1536,0.01240888900227017
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,3072,1024,0.00519822206762102
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,3072,1024,0.011717333561844297
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,3072,1024,0.02164799968401591
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,3072,768,0.004538666870858935
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,3072,5120,0.01032266683048672
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,3072,768,0.021956443786621094
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,3072,768,0.011422221859296164
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,3072,512,0.003913777983850903
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,3072,512,0.01107377807299296
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,3072,256,0.0035128887328836652
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,3072,2048,0.006582222051090664
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,3072,256,0.010727110836240979
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,3072,128,0.0032008888406885993
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,3072,2048,0.0129120002190272
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,3072,256,0.021898667017618816
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,3072,64,0.0025315555847353404
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,3072,128,0.010381333529949188
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,3072,1536,0.022618666291236877
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,3072,32,0.0028293333533737394
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,3072,128,0.020247111717859905
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,3072,64,0.011071110765139261
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,2560,65536,0.05749333567089505
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,3072,32,0.009720000127951304
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,2560,65536,0.06212800078921848
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,3072,7168,0.01984444426165687
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,2560,51200,0.05059911145104302
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,2560,16384,0.019080888893869188
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,2560,65536,0.12543022632598877
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,2560,16384,0.024143111374643113
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,2560,12288,0.015496888094478183
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,2560,16384,0.049192888869179614
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,2560,10240,0.013788444300492605
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,3072,512,0.021503999829292297
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,2560,12288,0.04480977853139242
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,2560,8192,0.011804444094498953
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,2560,10240,0.04082755578888787
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,2560,10240,0.02142133315404256
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,2560,8192,0.03769333495034112
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,2560,8192,0.01959733333852556
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,2560,7168,0.010998222563001843
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,2560,6144,0.010421333213647207
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,2560,7168,0.03604266709751553
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,2560,51200,0.04470577836036682
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,2560,6144,0.03376444511943393
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,2560,6144,0.018025777406162687
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,2560,5120,0.009663110805882348
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,2560,4096,0.00925333301226298
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,2560,5120,0.0332293344868554
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,2560,4096,0.01443911095460256
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,2560,3584,0.008629333641793992
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,2560,4096,0.028621332512961492
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,2560,51200,0.104001780351003
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,2560,3072,0.008288000192907121
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,2560,3584,0.013766222529941134
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,2560,12288,0.02299822204642826
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,2560,2560,0.0069004446268081665
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,2560,3072,0.013815110756291283
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,2560,2560,0.013246222502655454
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,2560,2560,0.026382222771644592
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,2560,2048,0.005892444401979446
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,2560,2048,0.012915555801656512
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,2560,2048,0.023689778314696416
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,2560,7168,0.018938667244381376
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,2560,1536,0.0055440002017551
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,2560,1024,0.004572444491916233
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,2560,1536,0.023303111394246418
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,2560,1536,0.012392000191741519
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,2560,1024,0.012255999777052136
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,2560,1024,0.02234577801492479
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,2560,5120,0.015531554818153381
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,2560,512,0.0038533334930737815
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,2560,768,0.012039999994966718
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,2560,768,0.021948445174429152
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,2560,256,0.0031840000301599503
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,2560,512,0.02232711182700263
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,2560,3584,0.02754488918516371
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,2560,256,0.010695111420419482
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,2560,128,0.0028497777465316984
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,2560,256,0.021612443857722815
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,2560,64,0.0027991111079851785
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,2560,3072,0.02571288910177019
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,2560,128,0.01035377797153261
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,2560,128,0.02019999921321869
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,2560,32,0.0028168888141711554
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,2048,65536,0.05125688844256931
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,2560,64,0.011729777687125735
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,2560,32,0.010348444183667501
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,2048,51200,0.03868800070550706
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,2048,65536,0.06031022469202677
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,2048,16384,0.01589777734544542
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,2048,51200,0.04933155576388041
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,2048,16384,0.023491554790072974
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,2048,65536,0.1257457733154297
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,2048,12288,0.013062222136391534
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,2048,51200,0.10388266377978855
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,2048,16384,0.04955200023121304
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,2048,10240,0.01163111130396525
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,2560,768,0.0041742221348815495
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,2048,8192,0.011177777416176267
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,2048,12288,0.043734222650527954
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,2048,10240,0.020579554968410067
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,2048,7168,0.01089866707722346
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,2048,8192,0.03752711084153917
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,2560,512,0.011030221978823343
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,2048,7168,0.03429333368937174
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,2048,7168,0.017282666431532968
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,2048,6144,0.033210668298933245
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,2048,6144,0.01661155621210734
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,2048,5120,0.008743999732865227
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,2048,5120,0.03122488988770379
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,2048,4096,0.010718222293588849
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,2048,4096,0.01421333352724711
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,2048,4096,0.029176000091764662
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,2048,3584,0.010037333601050908
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,2048,12288,0.02197066611713833
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,2048,3072,0.006598222172922558
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,2048,3584,0.013929777675204806
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,2048,10240,0.041787554820378624
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,2048,2560,0.00590133335855272
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,2048,3584,0.027106665902667578
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,2048,8192,0.0196079992585712
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,2048,3072,0.02609777781698439
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,2048,3072,0.013783111340469785
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,2048,2560,0.02513422237502204
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,2048,2560,0.013077333569526672
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,2048,6144,0.010116444693671333
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,2048,1536,0.005951111101441913
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,2048,2048,0.024705777565638225
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,2048,1024,0.004862222406599256
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,2048,2048,0.012730666332774691
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,2048,768,0.004176889028814104
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,2048,1536,0.022996443841192458
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,2048,1536,0.012734221915404001
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,2048,1024,0.02167644434505039
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,2048,512,0.0035333335399627686
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,2048,1024,0.012089778151777057
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,2048,768,0.02204799983236525
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,2048,768,0.011737777955002256
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,2048,5120,0.015174221661355762
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,2048,512,0.022295110755496558
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,2048,512,0.011305777562989129
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,2048,128,0.002846222163902389
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,2048,256,0.010689777632554373
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,2048,256,0.020594666401545208
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,2048,64,0.0028311111446883944
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,2048,128,0.0103502223889033
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,2048,32,0.0028648889727062653
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,2048,128,0.01993600030740102
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,1536,65536,0.036538667149013944
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,2048,64,0.011027555498811932
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,2048,32,0.01032977799574534
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,1536,65536,0.05838133229149712
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,1536,51200,0.04795644349522061
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,1536,65536,0.12469600306616889
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,1536,16384,0.013615111509958902
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,1536,51200,0.10431644651624893
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,2048,2048,0.006815111057625876
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,1536,12288,0.011328000161382886
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,1536,16384,0.022967999180157978
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,1536,16384,0.049250665638181895
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,1536,10240,0.010377777947319878
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,1536,12288,0.02083822256988949
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,1536,8192,0.010321777727868822
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,1536,10240,0.01977155605951945
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,1536,10240,0.04072711202833388
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,1536,7168,0.009341333475377824
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,1536,8192,0.016511999898486666
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,2048,256,0.0032302221904198327
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,1536,7168,0.016381333271662395
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,1536,7168,0.033933334880405
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,1536,6144,0.015238222148683337
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,1536,6144,0.03251466817326016
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,1536,5120,0.007667555577225155
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,1536,51200,0.029057777590221826
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,1536,5120,0.029612445169025
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,1536,5120,0.014711999230914645
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,1536,4096,0.027427555786238775
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,1536,4096,0.013759111364682516
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,1536,3584,0.007280888656775157
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,1536,3584,0.013760888742076026
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,1536,3584,0.02674666709370083
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,1536,3072,0.00656088896923595
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,1536,12288,0.04514133267932468
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,1536,3072,0.013391999734772576
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,1536,2560,0.005631111148330901
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,1536,3072,0.026429333620601233
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,1536,2048,0.005952000204059813
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,1536,2560,0.025760889053344727
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,1536,2560,0.013082666529549493
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,1536,8192,0.0362737774848938
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,1536,1536,0.005208888815508948
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,1536,2048,0.012739555703269111
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,1536,6144,0.008678221868144141
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,1536,1024,0.0042071110672420925
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,1536,2048,0.025056888659795124
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,1536,768,0.0038684445122877755
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,1536,1536,0.011765333513418833
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,1536,1024,0.02197155521975623
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,1536,1024,0.011752000285519494
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,1536,512,0.0033777778347333274
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,1536,768,0.02199555602338579
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,1536,768,0.012085333466529846
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,1536,256,0.0028595555987623003
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,1536,512,0.0207004447778066
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,1536,512,0.011050666371981302
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,1536,128,0.002834666727317704
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,1536,4096,0.007636444436179266
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,1536,256,0.021007999777793884
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,1536,64,0.002528000002106031
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,1536,32,0.0025457777082920074
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,1536,128,0.0192284451590644
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,1536,128,0.01035911093155543
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,1536,64,0.011017777853541903
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,1536,32,0.009862222605281407
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,1024,51200,0.021307556165589228
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,1024,65536,0.05602666404512194
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,1024,65536,0.12516178025139704
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,1024,51200,0.045087112320793994
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,1024,16384,0.01443911095460256
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,1024,51200,0.10270222028096516
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,1024,12288,0.01257599973016315
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,1024,16384,0.04898222287495931
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,1024,16384,0.022069333328141108
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,1024,10240,0.011685333318180509
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,1024,12288,0.019541333119074505
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,1024,12288,0.04227466715706719
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,1536,1536,0.02232711182700263
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,1024,8192,0.010379555324713389
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,1024,10240,0.017853332890404593
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,1024,10240,0.03936000002755059
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,1024,7168,0.009886222581068674
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,1024,8192,0.03617066807217068
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,1024,8192,0.016169778174824186
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,1024,6144,0.00869511150651508
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,1024,7168,0.03326311045222812
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,1024,7168,0.015808888607554965
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,1024,5120,0.00777688870827357
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,1536,256,0.011404444773991903
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,1024,6144,0.03116977877087063
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,1024,4096,0.007319110963079665
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,1024,5120,0.01459822224246131
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,1024,4096,0.013822221921549903
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,1024,3584,0.006907555378145642
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,1024,4096,0.02808800008561876
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,1024,3584,0.01370133293999566
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,1024,3584,0.026721777187453374
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,1024,3072,0.0063075555695427795
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,1024,3072,0.013071999781661563
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,1024,3072,0.025769778423839148
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,1024,2560,0.005605333381228977
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,1024,2560,0.012723555167516073
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,1024,2560,0.025399999486075506
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,1024,2048,0.006292444550328785
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,1024,2048,0.012445333103338877
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,1024,1536,0.005675555517276128
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,1024,6144,0.015140444040298462
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,1024,1536,0.011744000017642975
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,1024,1024,0.004519999855094486
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,1024,1536,0.023318222827381555
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,1024,768,0.003863111138343811
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,1024,65536,0.025777777036031086
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,1024,1024,0.021599110629823472
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,1024,1024,0.011722666521867117
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,1024,512,0.0035457776652442086
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,1024,768,0.012067555553383298
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,1024,768,0.02157955533928341
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,1024,256,0.0031831111345026228
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,1024,512,0.02037333283159468
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,1024,128,0.003157333367400699
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,1024,256,0.01034577770365609
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,1024,128,0.01071111112833023
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,1024,64,0.002867555452717675
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,1024,128,0.018578666779730055
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,1024,32,0.0028124445428450904
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,1024,64,0.011030221978823343
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,1024,32,0.010048888623714447
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,768,65536,0.021703999903466966
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,1024,2048,0.024359110328886244
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,768,51200,0.018180444836616516
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,768,65536,0.05339822173118591
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,768,65536,0.12454844845665826
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,768,16384,0.01036444471942054
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,768,51200,0.044531553983688354
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,768,51200,0.10263644324408637
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,1024,5120,0.030990223089853924
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,768,12288,0.010993777877754636
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,768,16384,0.02163999941613939
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,768,16384,0.048912889427608915
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,768,10240,0.01015733347998725
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,768,12288,0.04163466559516059
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,768,12288,0.018911111685964797
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,768,8192,0.008972444468074376
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,1024,512,0.011018666956159802
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,768,10240,0.01755644381046295
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,768,7168,0.00868800034125646
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,1024,256,0.021614222062958613
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,768,8192,0.03458755546145969
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,768,8192,0.01651022169325087
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,768,6144,0.008293333152929941
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,768,7168,0.033462223079469465
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,768,7168,0.015799999237060547
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,768,6144,0.03258488906754388
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,768,6144,0.01511111193233066
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,768,4096,0.007296000089910295
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,768,5120,0.029579556650585596
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,768,5120,0.014442667365074158
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,768,3584,0.007260444263617198
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,768,4096,0.02843466732237074
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,768,3072,0.006969778074158563
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,768,3584,0.02676888969209459
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,768,3072,0.013435555828942193
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,768,2560,0.006628444625271692
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,768,2560,0.013103110922707452
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,768,2560,0.02572711143228743
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,768,2048,0.005245333330498801
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,768,10240,0.037680887513690524
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,768,2048,0.012763555679056378
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,768,1536,0.0052373334765434265
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,768,5120,0.006973333656787872
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,768,1536,0.012432888978057437
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,768,1536,0.023022222850057814
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,768,4096,0.013753777576817406
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,768,1024,0.012042666474978128
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,768,3584,0.013434666726324292
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,768,768,0.0035502223504914176
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,768,1024,0.02160088883505927
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,768,512,0.0031831111345026228
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,768,3072,0.02613777750068241
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,768,768,0.022343110707071092
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,768,768,0.011383111278216044
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,768,256,0.003169777699642711
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,768,512,0.021219554874632094
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,768,128,0.002814222127199173
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,768,256,0.02125955621401469
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,768,256,0.010512000156773461
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,768,128,0.0105262224872907
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,768,128,0.01956266661485036
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,768,64,0.002826666666401757
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,768,32,0.0028293333533737394
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,512,65536,0.017504000001483493
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,768,64,0.011013333168294696
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,768,2048,0.023638221952650283
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,768,32,0.01071466671095954
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,512,51200,0.01499111122555203
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,512,65536,0.05323288838068644
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,512,16384,0.010620444185203977
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,512,65536,0.1251493295033773
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,512,51200,0.04379111197259691
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,512,12288,0.008730666504965888
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,512,16384,0.020986666282018025
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,512,16384,0.04823288983768887
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,512,10240,0.007896000312434303
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,512,12288,0.018575999471876357
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,512,12288,0.04108177622159322
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,512,8192,0.00794400026400884
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,512,10240,0.017646221650971305
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,512,10240,0.03906666570239597
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,512,7168,0.00794222205877304
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,512,8192,0.035960889524883695
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,512,8192,0.016196444630622864
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,512,6144,0.007266666326257918
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,512,7168,0.015843555331230164
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,512,7168,0.033944000800450645
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,512,5120,0.006919999917348226
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,512,6144,0.015249777171346875
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,512,6144,0.03230311142073737
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,512,4096,0.0069226668112807805
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,512,5120,0.029469334416919287
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,512,4096,0.013760888742076026
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,512,4096,0.02809244394302368
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,512,3584,0.0069102222720781965
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,512,3584,0.02774222195148468
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,768,1024,0.0042239998777707415
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,512,3584,0.013497778111033969
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,512,3072,0.006339555399285422
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,512,51200,0.10229155752393936
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,512,2560,0.006412444429265128
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,512,3072,0.02602400051222907
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,512,3072,0.013443555268976422
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,512,2048,0.005944889038801193
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,512,2560,0.02621511121590932
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,512,2560,0.012716444830099741
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,512,1536,0.004569777597983678
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,512,2048,0.023787554767396715
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,512,1024,0.003858666867017746
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,512,1536,0.011765333513418833
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,512,1536,0.02367288867632548
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,512,768,0.003559999995761447
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,768,512,0.011077333655622272
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,512,1024,0.021314667330847845
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,512,1024,0.011410666836632622
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,512,512,0.003162666741344664
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,512,768,0.02131555477778117
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,512,768,0.011749332977665795
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,512,256,0.0031475555151700974
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,512,512,0.020625778370433383
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,512,512,0.01090311093462838
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,512,128,0.0028702221396896574
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,512,256,0.020064888728989493
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,512,256,0.011100444528791638
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,512,64,0.002524444419476721
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,512,32,0.0028168888141711554
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,512,128,0.0185217774576611
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,256,65536,0.015033778217103748
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,512,64,0.011415111521879831
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,512,32,0.010009778042634329
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,256,51200,0.013183111117945777
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,256,65536,0.050683554675843984
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,256,65536,0.12349066469404434
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,256,16384,0.008655110994974772
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,256,51200,0.04179288943608602
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,256,12288,0.008277333445019191
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,256,51200,0.10116799672444661
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,256,16384,0.02090311050415039
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,256,16384,0.047275556458367236
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,256,10240,0.007630222373538547
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,512,2048,0.012759110993809171
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,256,12288,0.04109155469470554
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,256,8192,0.006963555183675554
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,256,10240,0.039408889081743025
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,256,10240,0.017468444175190397
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,256,7168,0.006586666736337874
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,256,8192,0.015875554747051664
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,256,8192,0.036321779092152916
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,256,6144,0.006632888896597757
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,256,7168,0.015474667151769003
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,256,7168,0.03456977672047085
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,256,5120,0.005961777849329843
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,256,6144,0.03119644522666931
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,256,6144,0.01514755520555708
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,256,4096,0.005783111270931032
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,256,5120,0.014719999498791166
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,256,5120,0.030140442980660334
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,256,3584,0.006252444452709622
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,512,5120,0.014735110931926303
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,256,4096,0.014003554979960123
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,256,4096,0.027106665902667578
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,256,3072,0.005937777873542573
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,256,3584,0.013089777694808112
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,256,3584,0.027506666051016912
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,256,2560,0.006224888894293044
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,256,3072,0.013088888592190213
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,256,3072,0.026748443643252056
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,256,2048,0.006031111296680238
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,256,2560,0.024393777052561443
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,256,2560,0.012763555679056378
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,256,1536,0.004528000122971005
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,256,2048,0.023364444573720295
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,256,2048,0.012747555143303342
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,256,1024,0.0038275557259718576
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,256,1536,0.022335999541812476
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,256,768,0.0035146665241983202
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,256,1024,0.012060444388124677
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,256,1024,0.021581333544519212
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,256,12288,0.018407111366589863
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,256,512,0.0031519999934567344
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,256,768,0.01107911103301578
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,256,256,0.0028195555011431375
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,256,768,0.022650667362742957
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,256,512,0.02057066725360023
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,256,512,0.01074044406414032
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,256,128,0.0028159999185138275
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,256,256,0.021949332621362474
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,256,256,0.010701333483060202
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,256,64,0.0024906665914588505
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,256,128,0.018573333819707234
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,256,128,0.010008888940016428
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,128,65536,0.014096000128322177
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,256,64,0.010683555569913654
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,256,32,0.009371555513805812
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,128,51200,0.012788444757461548
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,512,128,0.0103502223889033
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,128,65536,0.04891733328501383
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,128,16384,0.007663999994595845
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,128,65536,0.122871994972229
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,128,51200,0.040371557076772056
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,128,51200,0.1004248857498169
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,128,12288,0.006978666616810693
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,128,16384,0.047558221552107066
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,128,16384,0.02052533295419481
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,128,10240,0.0069226668112807805
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,128,12288,0.018538667096032035
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,128,10240,0.01721333298418257
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,128,8192,0.006699555450015598
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,128,10240,0.037639111280441284
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,128,7168,0.006578666468461354
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,128,8192,0.03491910960939195
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,128,8192,0.015864888827006023
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,128,6144,0.005959110955397288
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,128,7168,0.03326933251486884
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,128,6144,0.01478666729397244
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,128,5120,0.005565333283609814
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,128,6144,0.031184001101387873
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,256,32,0.0025066667132907445
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,128,4096,0.005922666854328579
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,128,5120,0.014160000615649752
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,128,5120,0.029531555043326482
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,128,3584,0.0058986664646201665
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,128,4096,0.014078223043017916
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,128,4096,0.027793778313530818
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,128,3072,0.005550222264395819
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,128,3584,0.013410666750537025
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,128,3584,0.027782221635182697
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,128,2560,0.005952000204059813
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,128,3072,0.02569155560599433
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,128,3072,0.012457778056462606
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,128,2048,0.005568000177542369
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,128,2560,0.013271999855836233
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,128,12288,0.04109333289994134
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,128,1536,0.004403555558787452
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,128,2048,0.012067555553383298
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,128,1536,0.011741333537631564
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,128,1024,0.003830222205983268
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,128,1536,0.022361778550677832
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,128,7168,0.015489778584904142
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,128,768,0.0035173334181308746
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,128,1024,0.021363554729355708
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,128,1024,0.011395555403497485
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,128,512,0.003157333367400699
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,128,768,0.011411555939250521
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,128,768,0.02125777800877889
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,128,256,0.0028080000645584534
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,128,512,0.02056711084312863
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,128,256,0.009983110758993361
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,128,256,0.020586666133668687
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,128,128,0.00253866674999396
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,128,128,0.017215111189418368
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,128,128,0.010654222634103564
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,128,64,0.0028168888141711554
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,128,32,0.0025271111064487034
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,128,64,0.010682666467295753
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,64,65536,0.010391111175219217
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,128,32,0.010004444254769219
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,256,1536,0.012503110700183444
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,64,51200,0.009351111120647853
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,128,2048,0.024706666668256123
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,64,16384,0.007298666569921706
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,64,51200,0.04071288969781663
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,64,12288,0.006274666637182236
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,64,16384,0.021298666795094807
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,64,10240,0.006263111200597551
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,64,12288,0.018522666560279
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,64,8192,0.006275555739800136
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,64,10240,0.017553778158293832
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,128,512,0.010688888529936472
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,64,7168,0.006615110983451207
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,64,6144,0.00591822216908137
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,64,5120,0.00556355549229516
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,64,7168,0.015127110812399121
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,64,6144,0.01513155632548862
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,64,4096,0.005379555539952383
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,64,3584,0.005586666779385672
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,64,5120,0.014472888575659858
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,64,3072,0.005271111097600725
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,64,4096,0.014148443937301636
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,64,2560,0.006246222390068903
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,64,3072,0.012783110969596438
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,64,2048,0.005594666633341048
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,8,128,2560,0.025386666258176167
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,64,2560,0.013110222087966071
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,64,1536,0.004249777644872665
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,64,1024,0.0037093332244290244
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,64,65536,0.04862844281726413
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,64,2048,0.012040889097584618
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,64,1536,0.012440000143316058
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,64,512,0.003176888864901331
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,64,1024,0.011365333365069495
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,64,256,0.0028355556229750314
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,64,768,0.011065777805116443
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,64,128,0.002826666666401757
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,64,512,0.011756444142924415
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,64,64,0.0028364445186323593
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,64,256,0.010344888601038191
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,64,32,0.002540444541308615
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,64,128,0.01035199976629681
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,64,64,0.01142133358452055
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,64,8192,0.016175111134847004
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,64,32,0.010016889207892949
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,32,51200,0.008667555948098501
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,32,16384,0.006280888699822956
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,32,65536,0.049534221490224205
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,32,51200,0.04054666558901469
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,32,12288,0.006623111251327727
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,32,10240,0.006258666515350342
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,32,16384,0.020917332834667627
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,64,3584,0.013111111190583972
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,32,8192,0.005535999933878581
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,32,12288,0.01854222185081906
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,32,7168,0.006133333262470033
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,32,10240,0.017539555827776592
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,32,6144,0.005935110979610019
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,32,5120,0.0059004442559348206
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,32,8192,0.015861334072219003
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,32,7168,0.01552177800072564
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,32,4096,0.005249777601824866
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,32,6144,0.015171556009186639
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,32,3584,0.005464000006516774
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,32,5120,0.014448000325096978
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,64,768,0.00342755557762252
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,32,4096,0.013624889155228933
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,32,2560,0.005568888866239124
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,32,3584,0.013762666947311826
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,32,2048,0.0052586665583981415
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,32,3072,0.013259555730554791
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,32,1536,0.0041848888827694785
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,32,1024,0.003559111307064692
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,32,2560,0.012210666305489011
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,32,768,0.0031715554909573663
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,32,2048,0.012739555703269111
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,32,512,0.0032017777363459268
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,32,1536,0.012439111040698158
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,32,1024,0.011381333072980246
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,32,256,0.00282222218811512
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,32,128,0.0028115556471877625
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,32,65536,0.008977777428097194
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,32,64,0.0024702221983008915
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,32,512,0.011747555600272285
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,32,32,0.0028400001012616684
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,32,256,0.010404444403118556
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,32,128,0.010728889041476779
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,32,64,0.011032889286677042
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,32,32,0.010370666782061258
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,65536,16384,0.21898933251698813
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,65536,16384,0.34024887614780003
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,8,32,3072,0.005594666633341048
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,65536,51200,0.4953902032640245
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,65536,12288,0.2612977822621663
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,65536,12288,0.15837332937452528
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,65536,10240,0.2046764426761203
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,65536,10240,0.13709421952565512
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,65536,8192,0.1536853313446045
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,65536,51200,1.0168693330552843
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,65536,7168,0.1333120001686944
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,8,32,768,0.011352000137170156
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,65536,8192,0.12600444422827825
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,65536,6144,0.11494310696919759
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,65536,7168,0.10964800251854791
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,65536,5120,0.0964862240685357
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,65536,4096,0.08019910918341742
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,65536,5120,0.08388888835906982
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,65536,3584,0.06944355699751112
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,65536,3072,0.0600186652607388
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,65536,4096,0.06840978066126506
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,65536,2560,0.051256000995635986
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,65536,6144,0.09412622451782227
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,65536,2048,0.042005333635542125
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,65536,3584,0.06136977672576904
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,65536,1536,0.03302133414480422
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,65536,3072,0.05460000038146973
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,65536,2048,0.04390133420626322
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,65536,1024,0.023510222633679707
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,65536,1536,0.035868446032206215
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,65536,1024,0.02665688925319248
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,65536,2560,0.046570665306515165
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,65536,512,0.013697778185208639
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,65536,256,0.008955555657545725
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,65536,768,0.023353776997990076
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,65536,128,0.006218666831652324
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,65536,512,0.01886755559179518
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,65536,64,0.005589333259397083
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,65536,32,0.0058782220714622075
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,65536,256,0.016858667135238647
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,65536,64,0.01516266663869222
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,65536,128,0.014434667097197639
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,65536,32,0.015127999915017022
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,51200,51200,0.3988453282250299
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,51200,65536,0.519886228773329
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,65536,768,0.018758222460746765
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,51200,51200,0.7528053389655219
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,51200,16384,0.25196888711717397
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,51200,65536,0.9703270594278971
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,51200,12288,0.1931377781762017
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,51200,16384,0.18107999695671928
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,51200,8192,0.14143910672929552
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,51200,10240,0.1622355514102512
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,51200,10240,0.10947910944620769
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,51200,8192,0.09882399770948623
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,51200,12288,0.13004799683888754
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,51200,5120,0.08939733107884724
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,51200,5120,0.07046044535107084
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,51200,4096,0.07297955618964301
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,51200,6144,0.07687644163767497
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,51200,3584,0.06318666537602742
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,51200,4096,0.06454310814539592
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,51200,3072,0.05537777807977465
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,51200,3584,0.05039288931422763
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,51200,2560,0.047472887569003634
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,51200,3072,0.04658755660057068
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,51200,2048,0.037920888927247785
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,51200,2560,0.0400622222158644
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,51200,1536,0.02978488802909851
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,51200,1024,0.021459556288189355
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,51200,2048,0.038324445486068726
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,51200,1536,0.030080888006422255
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,51200,768,0.015824889143308003
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,51200,1024,0.0236151119073232
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,51200,512,0.01127466642194324
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,51200,256,0.007373332977294922
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,51200,7168,0.12512444125281438
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,51200,6144,0.10629422134823269
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,51200,768,0.021008888880411785
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,51200,128,0.0038702223036024305
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,51200,512,0.018038221531444125
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,51200,64,0.003495111233658261
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,51200,256,0.01444533301724328
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,51200,32,0.003479111111826367
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,51200,64,0.014205333259370593
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,51200,32,0.014144889182514615
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,51200,128,0.013896889156765409
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,51200,7168,0.08455910947587754
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,16384,16384,0.08741511238945855
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,16384,65536,0.18360800213283965
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,16384,65536,0.3230222331153022
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,16384,51200,0.2502817842695448
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,16384,16384,0.07439466979768541
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,16384,51200,0.14012800322638616
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,16384,10240,0.055027554432551064
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,16384,8192,0.043807999955283276
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,16384,7168,0.03776266508632236
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,16384,12288,0.05901333358552721
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,16384,6144,0.03274755676587423
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,16384,8192,0.044682668315039746
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,16384,10240,0.047129776742723256
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,16384,7168,0.038557334078682795
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,16384,5120,0.02822222312291463
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,16384,4096,0.023670223024156358
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,16384,3584,0.02072533302836948
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,16384,6144,0.03929333223236932
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,16384,3072,0.018445332845052082
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,16384,5120,0.03290044599109226
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,16384,2560,0.016002666619088914
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,16384,4096,0.027451554934183758
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,16384,2560,0.021402666966120403
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,16384,3584,0.024682665864626568
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,16384,3072,0.023430221610599097
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,16384,1536,0.010833777487277985
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,16384,1024,0.008340444829728868
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,16384,1536,0.018094221750895183
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,16384,768,0.00702400008837382
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,16384,1024,0.016146666473812528
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,16384,512,0.005081777771313985
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,16384,768,0.013457777599493662
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,16384,256,0.003530666646030214
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,16384,12288,0.06732800271775988
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,16384,512,0.013773333695199756
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,16384,64,0.00286666676402092
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,16384,256,0.011704000333944956
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,16384,32,0.0028248888750871024
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,16384,128,0.012058667010731168
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,16384,64,0.01242844429281023
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,16384,32,0.011064888702498542
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,12288,65536,0.24702933099534777
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,12288,65536,0.1558684508005778
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,12288,16384,0.06702488660812378
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,16384,2048,0.020604444874657523
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,16384,2048,0.01331022216214074
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,12288,51200,0.12134310934278701
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,12288,12288,0.05168622069888645
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,12288,10240,0.04399111204677158
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,12288,8192,0.03719377848837111
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,12288,16384,0.0610026650958591
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,12288,10240,0.043415112627877124
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,12288,7168,0.03244355652067397
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,12288,6144,0.02937244375546773
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,12288,7168,0.03507377703984579
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,12288,8192,0.04658044377962748
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,12288,5120,0.025200888514518738
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,12288,6144,0.0320995549360911
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,12288,4096,0.021984888447655573
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,12288,3584,0.019685332973798115
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,12288,5120,0.02935289012061225
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,12288,3072,0.01738577749994066
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,12288,4096,0.02513244416978624
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,12288,2560,0.015207999282413058
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,12288,3072,0.021312889125612047
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,12288,2048,0.013408000270525614
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,12288,2560,0.020288000504175823
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,12288,51200,0.1903902159796821
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,12288,1536,0.008782222039169734
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,12288,1024,0.007066667079925537
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,12288,2048,0.019663110375404358
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,12288,768,0.005895111295912001
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,12288,1024,0.014832889040311178
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,12288,512,0.003847111016511917
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,12288,768,0.014174222946166992
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,12288,256,0.0033484444850020935
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,12288,12288,0.04816710948944092
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,12288,128,0.0028355556229750314
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,12288,512,0.013409777647919126
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,12288,64,0.0028417776856157514
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,12288,256,0.012433778080675336
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,12288,32,0.0028320000403457214
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,12288,128,0.011376889215575324
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,16384,128,0.003141333245568805
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,12288,64,0.012086222569147745
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,12288,32,0.010869333313571082
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,10240,65536,0.20623111724853516
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,10240,51200,0.1612479951646593
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,10240,65536,0.14937067031860352
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,10240,16384,0.05899555815590752
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,12288,3584,0.023696889479955036
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,10240,12288,0.04383111000061035
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,10240,51200,0.11633155081007217
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,10240,10240,0.03801688883039687
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,10240,8192,0.0318213336997562
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,10240,16384,0.05487022134992811
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,10240,7168,0.02882044514020284
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,10240,10240,0.03591555688116286
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,10240,12288,0.040440890524122454
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,10240,6144,0.02562933332390255
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,10240,8192,0.034196443027920194
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,10240,5120,0.02233155568440755
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,10240,4096,0.018981332580248516
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,10240,7168,0.03029511041111416
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,10240,3584,0.0173688895172543
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,12288,1536,0.01752088963985443
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,10240,3072,0.015488889482286243
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,10240,6144,0.027052443888452318
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,10240,5120,0.02571733295917511
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,10240,4096,0.022307554880777996
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,10240,2560,0.014024888475735983
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,10240,2048,0.011016888750924004
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,10240,1536,0.008643555144468943
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,10240,3584,0.02091644373204973
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,10240,1024,0.0063893331421746155
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,10240,3072,0.0199306673473782
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,10240,768,0.004861333303981357
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,10240,512,0.0042133331298828125
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,10240,2560,0.018571555614471436
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,10240,256,0.0031840000301599503
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,10240,128,0.0028533333291610083
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,10240,1024,0.013752000199423896
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,10240,768,0.012712889247470431
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,10240,64,0.0027991111079851785
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,10240,512,0.01308444473478529
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,10240,32,0.00282222218811512
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,10240,256,0.011716444459226398
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,10240,128,0.011776888536082374
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,10240,64,0.011424000064531961
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,10240,32,0.01033155537313885
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,8192,65536,0.17172622680664062
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,8192,16384,0.045175111956066556
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,8192,65536,0.10182755523257786
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,8192,51200,0.12859555085500082
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,8192,12288,0.03303555647532145
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,8192,51200,0.0780151089032491
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,8192,10240,0.027815110153622095
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,8192,8192,0.024159111910396155
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,8192,16384,0.042302221059799194
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,8192,12288,0.03507644600338406
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,8192,10240,0.03179733289612664
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,8192,7168,0.020326221982638042
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,8192,6144,0.018220444520314533
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,8192,5120,0.01578044394652049
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,8192,8192,0.028466665082507666
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,8192,7168,0.02438666588730282
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,8192,4096,0.013887999786270989
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,8192,6144,0.023676445086797077
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,8192,3584,0.011721777419249216
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,8192,3072,0.011034666664070554
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,8192,5120,0.021107556091414556
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,8192,4096,0.019319110446506076
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,8192,2560,0.009322666459613377
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,8192,3584,0.018424888451894123
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,8192,2048,0.008287111090289222
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,10240,2048,0.018222222725550335
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,8192,1536,0.007262222468852997
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,8192,2560,0.01715288890732659
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,8192,2048,0.01591111057334476
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,8192,768,0.003911111089918348
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,8192,1024,0.013095999757448832
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,8192,512,0.0034773333205117118
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,8192,768,0.012776888906955719
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,8192,256,0.0032133333798911837
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,8192,512,0.011741333537631564
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,8192,128,0.0028737777223189673
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,8192,256,0.011390222443474663
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,8192,64,0.0025395556456512874
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,8192,128,0.011034666664070554
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,8192,32,0.002814222127199173
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,8192,64,0.011368888947698804
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,8192,32,0.010020444790522257
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,7168,65536,0.14977778328789607
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,7168,65536,0.09224177731408013
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,7168,51200,0.11779022216796875
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,10240,1536,0.015641777051819693
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,8192,1024,0.005573333137565189
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,7168,16384,0.041454222467210554
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,7168,12288,0.03314133485158285
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,7168,51200,0.07163200113508436
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,8192,1536,0.014504889647165934
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,7168,10240,0.028463999430338543
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,7168,16384,0.040630221366882324
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,7168,8192,0.024323556158277724
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,7168,7168,0.01886577738655938
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,7168,12288,0.03527822097142538
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,7168,6144,0.016699555847379897
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,7168,10240,0.029826667573716905
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,7168,8192,0.026564444104830425
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,7168,4096,0.013061333033773633
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,7168,7168,0.02401155564520094
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,7168,3584,0.011304000185595619
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,7168,4096,0.01869244376818339
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,7168,3072,0.010213333699438307
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,7168,3072,0.01705333259370592
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,7168,2560,0.008976000050703684
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,7168,2560,0.016827555166350473
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,7168,2048,0.00793688909875022
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,8192,3072,0.01816177699300978
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,7168,1536,0.006604444649484422
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,7168,2048,0.015117333994971381
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,7168,1024,0.004512000001139111
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,7168,1536,0.014487110906177096
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,7168,768,0.003887999802827835
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,7168,1024,0.012747555143303342
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,7168,512,0.0035235554807715942
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,7168,5120,0.014463999205165438
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,7168,256,0.0029288888391521242
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,7168,768,0.012796444197495779
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,7168,6144,0.02331111166212294
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,7168,128,0.0028453332682450614
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,7168,512,0.011701333026091257
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,7168,64,0.0025191110455327565
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,7168,256,0.011374221907721626
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,7168,32,0.002542222125662698
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,7168,5120,0.020797333783573575
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,7168,3584,0.018204443984561496
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,7168,128,0.011360888679822287
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,7168,64,0.011374221907721626
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,6144,65536,0.12217066023084854
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,6144,51200,0.09637333287133111
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,6144,16384,0.03538399934768677
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,6144,51200,0.0657235582669576
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,6144,12288,0.028592000404993694
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,6144,10240,0.024655110306209985
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,6144,8192,0.021201777789327834
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,6144,12288,0.03200711144341363
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,6144,7168,0.018931556079122756
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,6144,10240,0.028142223755518597
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,6144,6144,0.016978666186332703
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,6144,8192,0.025987555583318073
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,6144,5120,0.015152888165579902
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,6144,7168,0.023042667243215773
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,6144,4096,0.011677333050303988
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,6144,6144,0.022294221652878657
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,6144,3584,0.01036533299419615
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,6144,4096,0.018166222506099276
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,6144,3072,0.009291555318567488
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,6144,3584,0.017910222212473553
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,6144,2560,0.008329778081840938
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,6144,3072,0.016499555773205228
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,6144,2048,0.0073520003093613525
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,6144,2560,0.016152888536453247
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,6144,1536,0.006304889089531369
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,6144,2048,0.01443199978934394
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,6144,1024,0.0042071110672420925
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,7168,32,0.010732444624106089
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,6144,1536,0.014123555686738757
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,6144,768,0.0035422220826148987
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,6144,65536,0.08300799793667264
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,6144,512,0.003528888854715559
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,6144,256,0.003195555466744635
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,6144,1024,0.01275111072593265
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,6144,16384,0.03776889046033224
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,6144,128,0.0028764444092909494
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,6144,768,0.01278222186697854
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,6144,64,0.002809777855873108
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,6144,512,0.011692444483439127
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,6144,32,0.002550222186578645
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,6144,256,0.012200888660218982
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,6144,128,0.01108977778090371
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,6144,64,0.011376000112957425
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,6144,32,0.00999466660949919
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,5120,51200,0.08478933572769165
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,5120,16384,0.03186400069130792
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,5120,65536,0.07723289065890841
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,5120,12288,0.025624000363879736
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,6144,5120,0.020992888344658747
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,5120,10240,0.022335999541812476
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,5120,16384,0.035791999763912626
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,5120,12288,0.02970400121476915
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,5120,8192,0.01956977778010898
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,5120,7168,0.017532444662517972
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,5120,10240,0.026000888811217412
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,5120,6144,0.01576622161600325
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,5120,5120,0.013764444324705334
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,5120,8192,0.024753777517212763
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,5120,7168,0.022271111607551575
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,5120,4096,0.011162666810883416
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,5120,6144,0.02240177823437585
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,5120,3584,0.00965244405799442
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,5120,3072,0.00852711084816191
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,5120,5120,0.01993955506218804
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,5120,2560,0.007714666426181793
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,5120,4096,0.01812177730931176
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,5120,3584,0.01706044375896454
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,5120,2048,0.006974221931563483
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,5120,3072,0.01591022147072686
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,5120,1536,0.005180444568395615
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,5120,1024,0.0039057777159743835
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,5120,2560,0.01482222146458096
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,5120,768,0.003527111063400904
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,5120,2048,0.014185777968830533
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,5120,512,0.0031679999083280563
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,5120,1536,0.013432888521088494
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,5120,1024,0.01240799989965227
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,5120,256,0.003176888864901331
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,5120,128,0.0028275555620590844
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,5120,768,0.012483555409643384
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,5120,64,0.0028782222006056043
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,5120,256,0.011353777514563667
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,5120,65536,0.10675911108652751
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,5120,32,0.002530666689078013
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,5120,128,0.01108000013563368
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,5120,64,0.01145866678820716
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,4096,65536,0.09115733040703668
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,5120,51200,0.06049955553478665
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,4096,51200,0.06681866778267755
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,5120,32,0.009639999932712978
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,4096,16384,0.026385777526431616
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,4096,65536,0.06848533285988702
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,4096,12288,0.020642666353119742
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,4096,10240,0.018183110488785636
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,4096,8192,0.016177778442700703
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,4096,51200,0.05550666650136312
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,4096,16384,0.03454666667514377
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,4096,12288,0.02798844377199809
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,4096,7168,0.01443199978934394
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,4096,10240,0.02479377720091078
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,4096,6144,0.013354666531085968
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,4096,5120,0.012063110868136087
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,4096,8192,0.02365155518054962
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,4096,4096,0.010687111152542962
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,4096,7168,0.021242666575643752
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,4096,3584,0.012051555845472546
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,4096,6144,0.019873778025309246
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,4096,5120,0.018911111685964797
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,4096,3072,0.010324444207880232
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,4096,4096,0.017267554998397827
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,4096,2560,0.008990222381220924
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,4096,3584,0.01646844380431705
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,4096,2048,0.007985778152942657
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,4096,1536,0.007306666837798224
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,4096,3072,0.014455111490355598
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,4096,2560,0.014420444766680399
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,4096,2048,0.014119111829333834
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,4096,768,0.004908444566859139
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,4096,1536,0.013051555388503604
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,4096,512,0.0041706665522522396
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,4096,1024,0.012048888537618848
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,4096,256,0.0031822222388452957
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,4096,768,0.012423111332787408
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,4096,128,0.0028897778441508612
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,4096,512,0.011392888923486074
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,4096,64,0.0028124445428450904
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,4096,256,0.011030221978823343
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,4096,32,0.0028026666906144884
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,4096,128,0.011733333269755045
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,4096,64,0.010999999940395355
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,3584,65536,0.08099289072884454
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,4096,32,0.010010666317409938
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,3584,51200,0.061436441209581166
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,3584,16384,0.02416444487041897
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,3584,65536,0.0661333335770501
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,3584,51200,0.053857776853773326
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,3584,12288,0.019088000059127808
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,3584,10240,0.01685244507259793
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,3584,16384,0.03291199935807122
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,3584,8192,0.014753777119848462
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,3584,10240,0.02369155486424764
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,3584,7168,0.013574221895800697
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,4096,1024,0.004947555561860402
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,3584,6144,0.01239999963177575
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,3584,7168,0.01993688941001892
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,3584,5120,0.011370666325092316
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,5120,512,0.012053333222866058
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,3584,6144,0.019928889142142404
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,3584,4096,0.010023111270533668
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,3584,3584,0.011337777806652917
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,3584,5120,0.018183110488785636
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,3584,3072,0.009651555783218807
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,3584,2560,0.008623110751310984
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,3584,4096,0.016775111357371014
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,3584,3584,0.015238222148683337
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,3584,2048,0.006968888971540663
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,3584,1536,0.005577777822812398
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,3584,2560,0.01443911095460256
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,3584,1024,0.004873777843183941
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,3584,2048,0.013471110827393003
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,3584,768,0.004468444320890638
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,3584,1536,0.01313777764638265
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,3584,512,0.0038568890757030914
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,3584,1024,0.01274577776590983
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,3584,256,0.003165333428316646
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,3584,768,0.012238221863905588
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,3584,128,0.0028577778074476454
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,3584,512,0.011758222348160215
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,3584,64,0.002806222273243798
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,3584,256,0.011956444217099084
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,3584,12288,0.027076444692081873
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,3584,32,0.002581333327624533
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,3584,128,0.011744889120260874
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,3584,64,0.011039111349317761
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,3072,65536,0.06320710976918538
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,3584,8192,0.0229768885506524
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,3072,51200,0.050781332784228854
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,3072,16384,0.020593777298927307
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,3072,65536,0.06445688671535917
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,3072,12288,0.01721955504682329
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,3072,51200,0.05231111248334249
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,3072,10240,0.0151591118839052
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,3072,16384,0.030192000998391047
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,3072,8192,0.013179555535316467
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,3072,7168,0.012390221986505719
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,3072,12288,0.025433777107132807
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,3072,6144,0.011392888923486074
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,3072,10240,0.02256977723704444
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,3072,8192,0.021659556362364028
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,3072,5120,0.010336000058386061
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,3072,4096,0.009771555662155151
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,3584,3072,0.013743999931547375
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,3072,3584,0.009336888790130615
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,3072,5120,0.01791466606987847
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,3072,4096,0.015105777316623263
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,3072,3072,0.009336888790130615
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,3072,2560,0.007605333295133378
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,3072,3584,0.014888889259762235
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,3072,3072,0.013769778112570444
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,3072,2048,0.006278222219811545
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,3072,2560,0.014105778601434497
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,3072,1536,0.006221333311663733
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,3072,1024,0.004912888838185204
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,3072,2048,0.013208000196350945
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,3072,1536,0.013083555632167392
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,3072,1024,0.011807999677128263
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,3584,32,0.01000533335738712
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,3072,512,0.004204444587230682
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,3072,512,0.011433777709801992
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,3072,256,0.0035573335157500375
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,3072,7168,0.019560888409614563
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,3072,256,0.011042666931947073
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,3072,128,0.0031511110977994073
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,3072,6144,0.018391110830836825
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,3072,64,0.0025191110455327565
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,3072,32,0.0028213332924577924
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,3072,128,0.01107022249036365
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,3072,64,0.01146133326821857
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,2560,65536,0.057020445664723717
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,3072,32,0.010399111443095738
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,2560,51200,0.04478933413823446
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,2560,16384,0.01886044442653656
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,2560,65536,0.0619608892334832
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,2560,51200,0.05072888731956482
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,2560,12288,0.01536177761024899
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,3072,768,0.00423200014564726
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,2560,16384,0.028075555960337322
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,2560,8192,0.012033777932325998
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,2560,7168,0.01129244433508979
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,2560,12288,0.024551999237802293
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,2560,10240,0.021662222014533147
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,2560,6144,0.01036444471942054
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,2560,5120,0.009827555881606208
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,2560,8192,0.02028622229894002
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,2560,4096,0.009317333499590555
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,2560,6144,0.016935111747847665
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,2560,5120,0.016262221667501662
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,2560,4096,0.01479555500878228
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,2560,3072,0.007986666427718269
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,2560,3584,0.014692443940374585
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,2560,2560,0.007152888509962294
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,2560,3072,0.013759999639458127
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,2560,2048,0.006005333529578314
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,2560,2560,0.013788444300492605
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,2560,1536,0.006098666538794835
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,2560,2048,0.012499555945396423
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,2560,1024,0.004856889032655292
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,2560,1536,0.01310222182008955
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,2560,768,0.0042364444169733255
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,2560,1024,0.011574221981896294
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,2560,512,0.003850666599141227
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,2560,10240,0.0136808885468377
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,2560,768,0.012141333685980903
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,2560,512,0.011415111521879831
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,3072,768,0.011882666912343768
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,2560,128,0.0031537777847713898
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,2560,64,0.002647111192345619
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,2560,256,0.011799111134476133
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,2560,7168,0.019094222121768527
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,2560,32,0.002814222127199173
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,2560,128,0.011377777490350934
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,2048,65536,0.04969955484072367
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,2560,3584,0.008778666456540426
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,2048,51200,0.03848888807826572
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,2560,32,0.010001777774757808
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,2048,16384,0.015876443849669564
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,2048,12288,0.012949333422713809
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,2048,65536,0.05981333388222588
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,2048,51200,0.049157334698571094
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,2048,10240,0.011681777735551199
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,2048,16384,0.025072889195548162
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,2048,8192,0.011364444262451597
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,2048,7168,0.010400888820489248
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,2048,12288,0.022455111145973206
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,2048,6144,0.009957333405812582
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,2048,8192,0.01921333372592926
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,2048,5120,0.00925422211488088
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,2048,7168,0.01718577742576599
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,2048,4096,0.010885333021481832
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,2048,6144,0.015820443630218506
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,2048,3584,0.009568000005351173
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,2048,5120,0.014785778191354541
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,2048,3072,0.006572444405820634
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,2048,4096,0.014448000325096978
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,2048,3584,0.014151111245155334
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,2560,256,0.003157333367400699
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,2048,3072,0.013406222065289816
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,2048,2048,0.006451555424266391
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,2048,1536,0.005551110953092575
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,2048,2560,0.013434666726324292
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,2048,1024,0.004554666578769684
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,2048,2048,0.012998222476906247
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,2048,768,0.003937777959638172
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,2048,1024,0.01236355553070704
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,2048,512,0.003536888708670934
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,2048,768,0.012075555821259817
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,2048,256,0.003165333428316646
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,2048,512,0.012097777591811286
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,2048,128,0.0028942223224374983
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,2048,256,0.011725333001878528
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,2048,64,0.0028320000403457214
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,2048,10240,0.02121688922246297
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,2048,128,0.011791110866599612
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,2048,64,0.011081777513027191
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,1536,65536,0.0361057784822252
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,2048,32,0.010384889112578498
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,2048,2560,0.005947555518812603
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,1536,65536,0.057950225141313344
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,1536,51200,0.02903644575013055
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,1536,16384,0.01296266665061315
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,1536,51200,0.04753511150677999
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,1536,12288,0.011228444675604502
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,2048,1536,0.012423111332787408
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,1536,16384,0.024336889386177063
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,1536,10240,0.010449777874681683
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,2560,64,0.01069777790043089
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,1536,8192,0.01035822182893753
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,1536,12288,0.021271111236678228
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,1536,7168,0.009697777529557547
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,1536,6144,0.009011555876996782
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,1536,10240,0.019320888651741874
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,1536,5120,0.007624000310897827
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,1536,8192,0.01682133310370975
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,1536,4096,0.007319110963079665
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,1536,7168,0.01588088936275906
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,1536,6144,0.015166223049163818
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,1536,3584,0.006996444529957241
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,1536,3072,0.006315555423498154
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,1536,5120,0.014507555299335055
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,1536,2560,0.0058906666106647914
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,1536,4096,0.013940445250935025
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,2048,32,0.002826666666401757
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,1536,2048,0.005936000082227919
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,1536,1536,0.004921777794758479
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,1536,1024,0.004239999999602635
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,1536,2560,0.01312711089849472
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,1536,768,0.0038951109680864546
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,1536,2048,0.01261333293384976
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,1536,1536,0.01239111108912362
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,1536,512,0.0035084444615576
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,1536,256,0.0031786666562159858
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,1536,1024,0.011724444727102915
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,1536,128,0.0028702221396896574
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,1536,768,0.01181422256761127
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,1536,512,0.011377777490350934
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,1536,64,0.0028284444577164124
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,1536,32,0.0028159999185138275
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,1536,256,0.011126221881972419
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,1536,128,0.011036444041464063
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,1024,65536,0.02569777766863505
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,1536,64,0.010732444624106089
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,1024,51200,0.021524444222450256
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,1536,32,0.01019022199842665
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,1024,16384,0.014893333117167154
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,1024,12288,0.0123831108212471
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,1024,65536,0.05505955550405714
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,1024,51200,0.045151111152437
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,1024,10240,0.011576000187132092
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,1024,16384,0.022591999835438196
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,1024,8192,0.010671111444632212
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,1024,12288,0.019713777634832595
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,1024,7168,0.009472000102202097
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,1024,6144,0.008641777767075432
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,1024,10240,0.01830844415558709
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,1024,8192,0.016326222154829238
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,1024,5120,0.007994666695594788
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,1024,4096,0.007607111500369177
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,1024,7168,0.015809777710172866
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,1024,3584,0.006903999795516332
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,1024,6144,0.014897776974572076
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,1024,5120,0.014491554763582019
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,1024,4096,0.013803555733627744
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,1536,3584,0.014107555150985718
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,1024,2560,0.005564444594913059
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,1536,3072,0.013461333182122974
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,1024,3584,0.013473778135246701
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,1024,2048,0.006574222197135289
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,1024,1536,0.005721777677536011
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,1024,3072,0.013040888640615674
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,1024,1024,0.004583111239804162
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,1024,768,0.003903111235962974
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,1024,2048,0.012426666915416718
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,1024,1536,0.01237777786122428
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,1024,512,0.0034959999223550162
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,1024,1024,0.011703111231327057
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,1024,256,0.0031600000543726813
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,1024,768,0.011751111182901593
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,1024,128,0.0028568889117903183
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,1024,64,0.0028613333900769553
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,1024,512,0.011428444749779172
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,1024,32,0.0028355556229750314
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,1024,256,0.011085333095656501
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,1024,128,0.011388444238238864
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,768,65536,0.021631111701329548
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,1024,64,0.011417778001891242
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,768,51200,0.017507554756270517
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,1024,32,0.009995555712117089
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,768,16384,0.010492444038391113
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,768,12288,0.010767111347781287
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,768,65536,0.053011556466420494
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,768,51200,0.04415111078156365
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,768,10240,0.009665778113736046
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,768,16384,0.021272889441914026
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,768,8192,0.009336888790130615
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,768,12288,0.019102222389645047
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,768,7168,0.008617777791288164
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,768,10240,0.01755822201569875
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,768,8192,0.016180444094869826
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,768,6144,0.007998222278224098
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,768,5120,0.0069511110583941145
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,1024,3072,0.006234666539563074
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,768,4096,0.007600888609886169
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,768,5120,0.01462577780087789
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,768,3584,0.006958222223652734
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,768,4096,0.013467555244763693
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,1024,2560,0.013304000099500021
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,768,3072,0.006940444310506185
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,768,2560,0.006248888870080312
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,768,3584,0.013806222213639153
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,768,2048,0.004895110925038655
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,768,3072,0.01312355531586541
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,768,1536,0.005218666460778978
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,768,2560,0.013094222380055321
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,768,1024,0.0042053332759274375
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,768,1536,0.012737777498033313
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,768,768,0.0038488888078265717
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,768,1024,0.011749332977665795
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,768,512,0.0031786666562159858
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,768,768,0.012053333222866058
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,768,256,0.0031662223239739737
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,768,512,0.011095110740926532
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,768,128,0.002838222309947014
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,768,256,0.011711999773979187
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,768,7168,0.015740444262822468
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,768,64,0.0028124445428450904
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,768,128,0.010868444210953183
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,768,32,0.0028213332924577924
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,768,6144,0.015050666199790107
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,512,65536,0.01733688844574822
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,768,64,0.010738666686746808
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,512,51200,0.014875556031862894
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,768,32,0.009377777576446533
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,512,16384,0.011023999916182624
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,512,12288,0.008641777767075432
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,512,65536,0.05231022172504001
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,512,10240,0.007602666815121968
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,512,16384,0.02100533412562476
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,512,8192,0.008293333152929941
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,512,10240,0.01720888912677765
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,768,2048,0.012448000411192576
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,512,7168,0.007643555601437886
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,512,8192,0.016154666741689045
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,512,6144,0.0076248885856734375
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,512,5120,0.0069217777086628815
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,512,4096,0.00759733302725686
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,512,7168,0.015847999188635085
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,512,6144,0.01482399966981676
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,512,5120,0.014102222190962898
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,512,3072,0.006598222172922558
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,512,4096,0.013391111459996967
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,512,2560,0.006302222195598815
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,512,3584,0.013804444836245643
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,512,2048,0.006015111174848344
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,512,2560,0.012715555727481842
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,512,1536,0.004494222087992562
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,512,2048,0.012210666305489011
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,512,1024,0.0038355555799272326
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,512,1536,0.01203733351495531
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,512,768,0.003531555748648114
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,512,1024,0.011370666325092316
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,512,512,0.0032097777972618737
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,512,51200,0.04377422067854139
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,512,768,0.011066666907734342
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,512,256,0.0031600000543726813
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,512,12288,0.0188746667570538
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,512,512,0.01107377807299296
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,512,64,0.0028400001012616684
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,512,256,0.011025778121418424
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,512,32,0.002520888836847411
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,512,128,0.011375111010339526
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,256,65536,0.016028443972269695
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,512,64,0.01033155537313885
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,256,51200,0.013355555633703867
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,512,32,0.009296000003814697
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,512,3584,0.0069671107663048645
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,256,16384,0.008619555168681675
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,256,12288,0.008275555239783393
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,256,65536,0.05003733436266581
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,256,10240,0.007610666255156199
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,256,51200,0.04089422358406915
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,256,8192,0.0069324444565508105
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,512,3072,0.013082666529549493
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,256,12288,0.018226666582955253
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,256,7168,0.006629333313968446
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,256,10240,0.017849778135617573
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,256,6144,0.0063680000603199005
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,256,5120,0.00601333338353369
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,256,7168,0.015506666567590503
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,256,4096,0.005702222386995952
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,256,6144,0.015182221929232279
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,256,3584,0.0064284445510970215
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,256,5120,0.014101333088344999
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,256,3072,0.005619555711746216
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,256,4096,0.013092444174819522
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,256,2560,0.006079111248254776
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,256,3584,0.014056000444624158
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,256,3072,0.013083555632167392
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,512,128,0.0028862222615215513
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,256,2048,0.005919999960396025
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,256,2560,0.012738666600651212
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,256,1536,0.004551110996140374
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,256,1024,0.0038453332251972626
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,256,2048,0.012073777616024017
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,256,768,0.003563555578390757
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,256,1536,0.011733333269755045
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,256,1024,0.011054221954610614
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,256,768,0.011408888631396823
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,256,256,0.0031537777847713898
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,256,16384,0.020929776959949072
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,256,256,0.01107377807299296
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,256,128,0.002833777831660377
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,256,64,0.0026293332791990707
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,256,8192,0.015912888778580558
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,256,32,0.0028364445186323593
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,256,64,0.011395555403497485
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,128,65536,0.014409777190950183
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,256,32,0.00924355536699295
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,128,51200,0.01274311128589842
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,128,65536,0.04903466502825419
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,128,16384,0.007986666427718269
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,128,51200,0.04008888867166307
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,128,12288,0.007320889168315464
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,128,16384,0.020938666330443487
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,128,10240,0.007310222420427535
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,128,12288,0.018212444252438016
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,256,512,0.003167111012670729
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,128,8192,0.006341333190600078
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,128,7168,0.006588444527652528
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,128,10240,0.017539555827776592
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,256,512,0.011074666347768573
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,128,6144,0.006626666833957036
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,128,8192,0.015855999456511605
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,128,5120,0.005945777727497949
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,128,7168,0.015496888094478183
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,128,4096,0.0059368887709246735
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,128,3584,0.006205333189831839
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,128,6144,0.014821334017647637
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,128,3072,0.0058986664646201665
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,128,4096,0.013420444395807056
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,128,2560,0.005897777775923411
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,128,3584,0.013735111388895245
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,256,128,0.01107022249036365
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,128,2048,0.005936000082227919
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,128,3072,0.013096888860066732
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,128,1536,0.004512000001139111
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,128,1024,0.0038364442686239877
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,128,2560,0.012785777449607849
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,128,2048,0.012114666402339935
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,128,768,0.003548444559176763
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,128,512,0.00315022220214208
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,128,1536,0.0123831108212471
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,128,1024,0.011031111081441244
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,128,256,0.0028320000403457214
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,128,128,0.0028088889602157804
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,128,512,0.011044444309340583
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,128,64,0.002485333424475458
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,128,256,0.010688888529936472
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,128,128,0.011696889168686338
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,128,64,0.010399999717871347
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,64,65536,0.01033688916100396
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,128,32,0.010386666489972008
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,64,51200,0.009937778115272522
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,64,65536,0.04858488837877909
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,64,16384,0.006836444553401735
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,64,51200,0.04071022073427836
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,64,12288,0.006303999986913469
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,128,5120,0.014137778017255994
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,64,10240,0.005953777581453323
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,64,8192,0.006584888945023219
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,64,16384,0.020590222544140287
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,64,7168,0.006256888724035687
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,64,12288,0.018792000081804063
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,64,10240,0.01716444392999013
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,64,6144,0.006592000110281839
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,64,8192,0.016167999969588388
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,64,5120,0.005923555543025334
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,64,4096,0.00563466673096021
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,64,6144,0.014494222071435718
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,64,3584,0.00591822216908137
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,64,4096,0.013794666363133324
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,128,768,0.011377777490350934
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,64,3072,0.005913777897755305
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,64,2560,0.006275555739800136
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,128,32,0.0028444443725877335
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,64,3072,0.012749333348539142
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,64,2048,0.005550222264395819
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,64,2560,0.013438222308953604
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,64,1536,0.0041928887367248535
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,64,1024,0.0035617777870761026
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,64,2048,0.012151999606026543
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,64,768,0.003524444583389494
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,64,1536,0.012746666868527731
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,64,1024,0.011028444601429833
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,64,512,0.0031946665710873077
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,64,256,0.0029004443850782183
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,64,128,0.0026311110705137253
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,64,768,0.011367999845080905
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,64,512,0.011063111325105032
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,64,256,0.011032889286677042
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,64,64,0.002471111093958219
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,64,32,0.0025271111064487034
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,64,64,0.011024889018800525
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,32,65536,0.009319999979601966
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,64,32,0.009707555174827576
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,32,51200,0.008343111309740279
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,64,7168,0.015467555986510383
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,32,16384,0.006413333531883027
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,64,5120,0.01442488862408532
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,32,12288,0.0062977779242727495
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,32,51200,0.040052443742752075
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,32,10240,0.005728888842794631
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,32,16384,0.020598222812016804
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,64,3584,0.013468444347381592
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,32,8192,0.005548444473081165
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,32,12288,0.018580444984965853
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,32,10240,0.016857778032620747
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,32,6144,0.005636444522274866
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,32,8192,0.015802666544914246
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,32,5120,0.005590222362014983
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,32,7168,0.015807110402319167
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,32,4096,0.005559111220969095
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,32,6144,0.01461155547036065
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,32,3584,0.005552000055710475
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,32,5120,0.014083556003040738
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,32,3072,0.005264889034960005
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,32,4096,0.013794666363133324
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,32,2560,0.006046222315894232
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,32,3584,0.013125333521101209
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,32,2048,0.0052728888889153796
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,64,128,0.011022222538789114
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,32,2560,0.013095999757448832
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,32,1536,0.004214222232500712
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,32,1024,0.0035342222286595237
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,32,2048,0.011709333293967776
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,32,768,0.00351200004418691
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,32,1536,0.012061333490742577
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,32,1024,0.011745777395036487
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,32,768,0.011075555450386472
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,32,65536,0.04841777682304382
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,32,256,0.0028408887899584244
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,32,128,0.0026391111314296722
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,32,512,0.01145333300034205
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,32,64,0.0025395556456512874
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,32,256,0.011069333387745751
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,32,32,0.002499555548032125
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,32,128,0.01074222226937612
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,32,64,0.011404444773991903
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,32,32,0.010050666828950247
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,65536,16384,0.3393662240770128
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,7,32,3072,0.012784000072214337
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,65536,51200,0.4952541987101237
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,32,512,0.003168888803985384
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,65536,16384,0.22774489720662436
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,65536,12288,0.15955732928382024
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,65536,51200,1.0144053565131295
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,65536,10240,0.2048808866076999
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,65536,10240,0.14378044340345594
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,65536,8192,0.1683706707424588
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,7,32,7168,0.0059057776298787855
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,65536,7168,0.1327706707848443
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,65536,6144,0.11495733261108398
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,65536,6144,0.09530399905310737
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,65536,7168,0.11068355374866062
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,65536,5120,0.09672088755501641
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,65536,8192,0.14557511276668972
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,65536,3584,0.06871200270122953
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,65536,4096,0.07982310983869764
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,65536,5120,0.0816497802734375
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,65536,3072,0.06057866414388021
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,65536,3584,0.061054223113589816
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,65536,2560,0.05074933171272278
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,65536,2048,0.04241866535610623
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,65536,3072,0.05781155824661255
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,65536,12288,0.25921956698099774
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,65536,2048,0.03899822301334805
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,65536,1024,0.023577777875794306
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,65536,2560,0.05136355426576403
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,65536,768,0.018497778309716117
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,65536,1536,0.03581155671013726
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,65536,512,0.013601777454217276
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,65536,256,0.008647110727098253
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,65536,768,0.0229111115137736
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,65536,512,0.018532445033391316
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,65536,128,0.006574222197135289
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,65536,64,0.005606222069925732
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,65536,256,0.016473778420024447
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,65536,1024,0.027106665902667578
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,65536,32,0.005881777654091517
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,65536,64,0.014832889040311178
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,65536,32,0.01478666729397244
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,65536,4096,0.08057244618733723
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,65536,1536,0.03243022163709005
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,51200,51200,0.3985084427727594
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,51200,65536,0.5235715442233616
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,51200,51200,0.7480222384134928
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,51200,12288,0.19297333558400473
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,51200,65536,0.9713004430135092
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,51200,16384,0.25108178456624347
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,51200,16384,0.155184891488817
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,51200,10240,0.16161778238084581
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,65536,128,0.01443911095460256
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,51200,8192,0.13329154915279812
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,51200,10240,0.11353777514563666
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,51200,12288,0.13049777348836264
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,51200,7168,0.12039466698964436
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,51200,5120,0.08791022168265449
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,51200,6144,0.10609510872099136
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,51200,7168,0.08678666750590007
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,51200,6144,0.07994133234024048
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,51200,4096,0.07310044765472412
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,51200,3584,0.06398133436838786
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,51200,8192,0.09832977586322361
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,51200,4096,0.06042310926649305
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,51200,5120,0.07049777772691515
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,51200,2560,0.047360890441470675
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,51200,3584,0.050554666254255504
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,51200,3072,0.055192000336117215
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,51200,2048,0.037801778978771634
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,51200,1536,0.029376887612872656
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,51200,3072,0.047044446070988975
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,51200,1024,0.021120000216695998
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,51200,768,0.01591466698381636
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,51200,2560,0.04366844561364916
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,51200,2048,0.033533334732055664
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,51200,1536,0.03087555699878269
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,51200,256,0.007292444507280986
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,51200,128,0.003934222377008862
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,51200,768,0.021589333812395733
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,51200,1024,0.023535999986860488
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,51200,64,0.0034906665484110513
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,51200,256,0.014442667365074158
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,51200,32,0.003528888854715559
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,51200,128,0.01294222225745519
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,51200,64,0.01481244464715322
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,51200,32,0.013409777647919126
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,16384,65536,0.3202986717224121
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,16384,65536,0.1855706638760037
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,16384,51200,0.24972444110446504
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,16384,16384,0.08643111255433823
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,16384,51200,0.14006488853030735
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,16384,12288,0.06678133540683322
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,16384,16384,0.06731733348634508
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,16384,10240,0.054939554797278516
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,16384,8192,0.04393777913517422
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,16384,10240,0.05094844433996412
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,16384,12288,0.06217688984341092
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,16384,8192,0.04361688759591845
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,16384,6144,0.032912890116373696
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,16384,5120,0.02831733226776123
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,16384,7168,0.0400622222158644
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,51200,512,0.011412444214026133
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,16384,6144,0.03634044528007507
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,16384,4096,0.023980443676312763
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,16384,3584,0.02065333392884996
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,51200,512,0.017280000779363845
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,16384,5120,0.032637334532207914
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,16384,3072,0.018271999226676095
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,16384,4096,0.02844266759024726
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,16384,2560,0.015744000673294067
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,16384,2048,0.01310488912794325
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,16384,1536,0.010595555934641095
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,16384,3072,0.023375999596383836
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,16384,2560,0.022117333279715642
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,16384,3584,0.025405334101782903
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,16384,1024,0.008367111285527548
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,16384,2048,0.019840000404251944
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,16384,768,0.0069066666894488865
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,16384,1536,0.018592000007629395
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,16384,256,0.0032177778581778207
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,16384,768,0.01444355481200748
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,16384,1024,0.01569600072171953
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,16384,512,0.013468444347381592
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,16384,64,0.0028657778683635923
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,16384,256,0.01274577776590983
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,16384,32,0.0028773333049482773
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,16384,128,0.011728888584507836
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,16384,64,0.011754666765530905
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,16384,32,0.011037333144081963
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,16384,7168,0.037308444579442344
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,12288,65536,0.24180621571011016
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,12288,65536,0.15641155507829455
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,12288,16384,0.06640266709857516
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,12288,51200,0.1894542243745592
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,12288,51200,0.12065688769022624
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,12288,12288,0.05161066518889534
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,12288,16384,0.06178577740987142
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,12288,10240,0.04421155651410421
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,12288,12288,0.048604445325003735
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,12288,8192,0.037054220835367836
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,12288,10240,0.044919110006756253
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,12288,6144,0.02863822380701701
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,12288,8192,0.03906844390763177
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,16384,512,0.004852444347408083
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,12288,7168,0.0357582237985399
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,12288,6144,0.03292355603641934
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,12288,3584,0.019488000207477145
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,16384,128,0.003080888961752256
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,12288,5120,0.027775110469924078
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,12288,4096,0.025587555434968736
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,12288,3584,0.022523555490705702
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,12288,2560,0.015399111641777886
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,12288,3072,0.022207111120224
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,12288,2048,0.013455111119482251
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,12288,2560,0.021032000581423443
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,12288,1536,0.008976000050703684
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,12288,2048,0.018461333380805123
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,12288,1024,0.0070186663005087115
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,12288,1536,0.01719199948840671
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,12288,768,0.006073777874310811
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,12288,1024,0.015038222074508667
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,12288,7168,0.03268355462286208
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,12288,512,0.0038373333712418876
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,12288,768,0.013760888742076026
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,12288,256,0.00314666661951277
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,12288,128,0.003156444471743372
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,12288,512,0.012893333203262754
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,12288,256,0.012058667010731168
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,12288,5120,0.025511110822359722
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,12288,32,0.0028764444092909494
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,12288,4096,0.022227555513381958
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,12288,64,0.010391111175219217
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,12288,32,0.011064888702498542
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,12288,3072,0.01735555628935496
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,10240,65536,0.20576800240410698
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,10240,16384,0.058614220884111196
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,10240,51200,0.16167467170291477
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,10240,65536,0.14893333117167154
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,10240,51200,0.11576622062259251
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,10240,12288,0.044102221727371216
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,10240,10240,0.03793155484729343
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,10240,8192,0.031946665710873075
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,10240,12288,0.04158488909403483
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,10240,16384,0.055454221036699086
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,10240,10240,0.03973777757750617
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,10240,7168,0.028929776615566675
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,10240,6144,0.0258942229880227
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,10240,8192,0.03348355491956075
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,10240,5120,0.022296888960732356
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,10240,7168,0.03088088830312093
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,10240,4096,0.019310222731696237
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,10240,6144,0.02695466743575202
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,10240,3584,0.017367111312018502
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,10240,5120,0.02450399928622776
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,10240,3072,0.015659555792808533
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,10240,2560,0.014173333843549093
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,10240,3584,0.020279111133681405
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,10240,2048,0.011017777853541903
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,12288,64,0.0025884444928831523
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,10240,3072,0.01995822290579478
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,12288,128,0.011717333561844297
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,10240,2560,0.01924800044960446
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,10240,1024,0.006299555715587404
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,10240,2048,0.01704355577627818
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,10240,768,0.004646222210592694
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,10240,512,0.0038417776425679526
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,10240,1024,0.014133334159851074
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,10240,768,0.013977777626779346
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,10240,512,0.01204533295498954
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,10240,128,0.0028320000403457214
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,10240,256,0.012461333639091916
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,10240,128,0.011016888750924004
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,10240,64,0.0028648889727062653
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,10240,32,0.0028417776856157514
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,10240,64,0.01038577738735411
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,10240,32,0.010692444112565784
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,8192,65536,0.1701893276638455
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,10240,4096,0.02295733326011234
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,8192,65536,0.1019235584470961
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,8192,51200,0.12866844071282282
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,8192,16384,0.04507911205291748
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,10240,1536,0.009105777574910058
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,8192,51200,0.07794577545589872
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,8192,10240,0.02755466600259145
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,8192,16384,0.04281422164705065
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,10240,1536,0.01536622146765391
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,8192,8192,0.023312888211674158
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,8192,12288,0.03567288981543647
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,8192,7168,0.020733333296246
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,10240,256,0.003134222287270758
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,8192,6144,0.018220444520314533
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,8192,8192,0.027067555321587458
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,8192,10240,0.032631999916500516
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,8192,5120,0.01571644511487749
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,8192,4096,0.013738666971524557
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,8192,7168,0.025063110722435847
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,8192,3584,0.011853333148691388
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,8192,6144,0.02407199972205692
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,8192,3072,0.010860444770918952
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,8192,5120,0.021271111236678228
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,8192,4096,0.019509333703253005
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,8192,2560,0.009637333452701569
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,8192,2048,0.008355555435021719
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,8192,3584,0.01869777838389079
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,8192,1536,0.007246221933099959
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,8192,3072,0.0184897780418396
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,8192,1024,0.0052168890833854675
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,8192,2560,0.016971555021074083
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,8192,2048,0.015391111373901367
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,8192,768,0.0038444445365005066
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,8192,512,0.003531555748648114
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,8192,1536,0.01443733274936676
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,8192,1024,0.013449778159459433
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,8192,256,0.0031431110368834603
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,8192,128,0.002883555574549569
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,8192,512,0.011422221859296164
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,8192,256,0.012091555529170565
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,8192,64,0.00281866660548581
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,8192,32,0.0028000000036425064
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,8192,128,0.011747555600272285
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,8192,12288,0.03286222285694546
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,8192,32,0.010066666536860997
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,7168,65536,0.14759200149112278
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,7168,51200,0.1172951062520345
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,7168,16384,0.0414284434583452
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,7168,51200,0.07140711281034681
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,7168,65536,0.09120888842476739
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,7168,12288,0.032983111010657415
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,7168,10240,0.028415110376146104
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,7168,16384,0.04271555609173245
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,7168,8192,0.024496888120969135
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,7168,12288,0.03493600090344747
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,7168,7168,0.018757333358128864
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,7168,6144,0.016520889268981088
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,7168,10240,0.030181331766976252
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,7168,8192,0.026741334133678015
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,7168,5120,0.0144195556640625
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,7168,7168,0.024339555038346186
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,7168,4096,0.012658666405412885
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,7168,3584,0.011352000137170156
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,7168,5120,0.021271111236678228
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,7168,6144,0.023648000425762598
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,7168,4096,0.018917333748605516
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,7168,3072,0.010027555955780877
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,7168,2560,0.008950221869680617
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,8192,768,0.012741333080662621
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,7168,2048,0.007713778151406183
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,7168,3584,0.0185208883550432
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,7168,1536,0.00656444455186526
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,7168,3072,0.017831999394628737
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,7168,1024,0.005197333378924264
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,7168,2560,0.01648266613483429
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,7168,768,0.003555555724435382
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,7168,2048,0.014688000082969666
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,7168,512,0.003510222252872255
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,7168,256,0.003162666741344664
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,7168,1536,0.014108444253603617
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,7168,1024,0.012667555775907306
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,7168,128,0.002855111120475663
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,7168,768,0.012095111111799875
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,8192,64,0.011061333119869232
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,7168,64,0.0027964444210131965
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,7168,512,0.011415999796655444
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,7168,256,0.012058667010731168
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,7168,128,0.010710222025712332
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,7168,64,0.010748444332016839
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,7168,32,0.010834666589895884
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,6144,65536,0.12251999643113877
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,6144,16384,0.03540800015131632
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,6144,51200,0.0964417788717482
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,6144,65536,0.08451910813649495
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,6144,12288,0.028845333390765723
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,6144,51200,0.06520889202753703
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,6144,10240,0.02444533341460758
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,6144,16384,0.03866399990187751
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,6144,12288,0.03287022312482198
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,6144,7168,0.018883556127548218
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,6144,10240,0.028522666957643297
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,6144,6144,0.017111111018392775
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,6144,8192,0.02769600020514594
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,6144,5120,0.015119110544522604
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,6144,7168,0.023052444060643513
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,6144,6144,0.022443556123309668
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,6144,5120,0.020283554991086323
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,6144,4096,0.018411555223994784
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,6144,3072,0.009395555489593083
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,6144,3584,0.01755644381046295
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,6144,2560,0.008560000194443597
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,6144,3072,0.017093333933088515
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,6144,2048,0.00723555518521203
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,6144,2560,0.015855110353893705
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,6144,1536,0.0063475556671619415
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,7168,32,0.0027991111079851785
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,6144,2048,0.0140364451540841
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,6144,1024,0.0038844446341196695
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,6144,768,0.003556444413132138
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,6144,1536,0.013817778064144982
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,6144,512,0.003506666670242945
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,6144,1024,0.012368888490729861
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,6144,256,0.003149333306484752
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,6144,768,0.012755555411179861
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,6144,128,0.0028719999310043124
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,6144,512,0.011824888487656912
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,6144,8192,0.02141777839925554
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,6144,256,0.011415111521879831
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,6144,64,0.0028133332315418455
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,6144,32,0.0028231110837724474
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,6144,128,0.011612444288200803
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,6144,64,0.010712888505723743
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,6144,32,0.010344888601038191
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,5120,65536,0.10681066910425822
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,6144,3584,0.010247111320495605
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,5120,65536,0.07614488734139337
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,5120,51200,0.05988533629311455
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,5120,12288,0.025655999779701233
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,5120,16384,0.03663555449909634
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,5120,10240,0.021885333789719477
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,5120,12288,0.031975110371907554
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,5120,8192,0.019505777292781405
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,5120,7168,0.017246221502621967
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,5120,10240,0.027296000056796606
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,5120,8192,0.024431111084090337
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,5120,6144,0.015395555231306287
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,5120,5120,0.014122666584120857
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,5120,7168,0.02295555505487654
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,5120,4096,0.011167111496130625
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,5120,6144,0.02163200080394745
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,5120,3584,0.009387555221716562
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,5120,5120,0.01957244508796268
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,5120,3072,0.008789333204428354
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,5120,4096,0.018191999859280057
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,5120,2560,0.0079297779334916
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,5120,3584,0.017121778594122995
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,5120,2048,0.006741333338949416
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,5120,3072,0.01585244470172458
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,6144,4096,0.011703111231327057
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,5120,1536,0.0053226666318045715
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,5120,1024,0.0038408889538711975
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,5120,2560,0.015303111738628812
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,5120,768,0.0036071112586392295
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,5120,51200,0.08426133129331802
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,5120,2048,0.014124444789356656
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,5120,512,0.0032177778581778207
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,5120,1536,0.013425778183672162
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,5120,16384,0.03161155515246921
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,5120,256,0.0031831111345026228
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,5120,128,0.0028159999185138275
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,5120,768,0.012107555237081317
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,5120,512,0.011743110915025076
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,5120,256,0.011035555766688453
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,5120,128,0.011425777441925473
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,5120,64,0.01069866700304879
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,4096,65536,0.09121333228217231
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,5120,32,0.010415111151006486
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,4096,51200,0.06667288806703356
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,4096,65536,0.06861155562930636
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,4096,16384,0.026188444760110643
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,4096,51200,0.055340445703930326
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,4096,12288,0.020575111111005146
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,4096,10240,0.018522666560279
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,4096,16384,0.033415112230512835
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,4096,8192,0.01588622232278188
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,4096,12288,0.03174133433236016
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,4096,7168,0.014499555031458536
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,4096,10240,0.02678844498263465
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,4096,6144,0.013213333156373767
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,4096,8192,0.02364088926050398
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,4096,5120,0.012079999678664737
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,4096,7168,0.02200266718864441
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,4096,4096,0.010848888920413123
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,4096,6144,0.020863110820452373
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,4096,5120,0.018888889087571036
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,4096,3584,0.011057777537239922
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,4096,3072,0.00997155573632982
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,4096,4096,0.01796444422668881
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,4096,2560,0.009310222334331935
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,5120,64,0.002826666666401757
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,4096,3584,0.01551555593808492
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,5120,32,0.0028488888508743713
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,4096,2048,0.0083155557513237
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,4096,3072,0.01513066722287072
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,4096,1536,0.005924444645643234
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,4096,1024,0.004864888886610667
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,4096,2560,0.014797333214018079
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,4096,768,0.004229333251714706
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,4096,512,0.0038444445365005066
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,4096,1536,0.013136000268989138
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,4096,1024,0.01275288893116845
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,4096,256,0.0031439999325407874
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,4096,768,0.012108444339699216
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,4096,128,0.0028204443968004654
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,4096,512,0.011726222104496427
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,4096,256,0.012039999994966718
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,4096,32,0.0025617778301239014
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,4096,128,0.011404444773991903
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,4096,64,0.010732444624106089
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,3584,65536,0.07908178038067289
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,4096,32,0.01038755559258991
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,3584,51200,0.061159114042917885
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,3584,65536,0.06662755542331271
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,3584,16384,0.02421066661675771
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,3584,51200,0.05415644579463535
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,3584,12288,0.01905155513021681
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,3584,10240,0.01683022247420417
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,3584,16384,0.03425155414475335
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,3584,8192,0.014765333798196582
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,3584,12288,0.029867556360032823
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,5120,1024,0.012463111016485425
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,3584,10240,0.02507200009293026
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,3584,7168,0.013460444079505073
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,3584,8192,0.024340444140964087
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,3584,6144,0.012728888955381183
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,3584,5120,0.011351111034552256
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,3584,7168,0.02121688922246297
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,3584,4096,0.010339555641015371
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,4096,2048,0.013779555757840475
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,3584,6144,0.02040177749262916
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,3584,5120,0.017702221870422363
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,3584,3584,0.010327111515733931
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,3584,3072,0.009318222602208456
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,3584,2560,0.008169777691364288
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,3584,4096,0.016985777351591323
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,4096,64,0.0025173332542181015
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,3584,3584,0.015122666954994202
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,3584,2048,0.0069413334131240845
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,3584,3072,0.014196443888876172
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,3584,1536,0.006229333165619109
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,3584,1024,0.004893333133724001
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,3584,2560,0.014440889159838358
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,3584,768,0.004231111043029361
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,3584,2048,0.013439111411571503
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,3584,512,0.003567111161020067
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,3584,1536,0.012725333372751871
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,3584,256,0.003156444471743372
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,3584,128,0.0028773333049482773
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,3584,768,0.011705777711338468
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,3584,512,0.011780444118711682
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,3584,64,0.002526222210791376
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,3584,256,0.01072799993885888
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,3584,32,0.0025439999169773525
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,3584,128,0.011032000184059143
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,3072,65536,0.06305244233873156
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,3584,64,0.011190222369299995
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,3584,32,0.010355555348926121
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,3072,51200,0.050844444168938525
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,3072,16384,0.020250666472646926
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,3072,65536,0.06417422162161933
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,3072,51200,0.051959110630883105
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,3072,16384,0.030015110969543457
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,3072,10240,0.014953777194023132
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,3072,8192,0.01309866706530253
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,3072,12288,0.02715555495686001
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,3072,7168,0.01237155579858356
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,3072,10240,0.02382755610677931
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,3072,6144,0.011284444067213269
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,3072,8192,0.02072177827358246
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,3072,5120,0.010455999937322406
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,3072,6144,0.01942399972014957
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,3072,4096,0.009724444813198512
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,3072,5120,0.01670488880740272
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,3072,3584,0.00923733330435223
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,3072,4096,0.016168889072206285
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,3584,1024,0.012795555922720166
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,3072,3584,0.014483556151390076
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,3072,2560,0.007596444752481248
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,3072,3072,0.014150222142537435
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,3072,2048,0.00628977765639623
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,3072,2560,0.013789333403110504
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,3072,2048,0.013207111093733044
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,3072,12288,0.01717333330048455
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,3072,1024,0.004923555586073133
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,3072,1536,0.012717333104875354
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,3072,768,0.004232888834344016
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,3072,512,0.003573333223660787
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,3072,1024,0.011962666279739805
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,3072,768,0.012095111111799875
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,3072,256,0.00350222239891688
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,3072,512,0.011413333316644033
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,3072,128,0.003176888864901331
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,3072,64,0.0024888888001441956
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,3072,256,0.011354666617181567
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,3072,32,0.002540444541308615
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,3072,128,0.011374221907721626
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,3072,7168,0.019955555597941082
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,3072,64,0.010687111152542962
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,2560,65536,0.05675911241107517
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,2560,51200,0.044418666097852916
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,3072,32,0.010727110836240979
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,2560,16384,0.018977777825461496
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,2560,65536,0.0619680020544264
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,2560,12288,0.01566844516330295
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,2560,10240,0.013792888985739814
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,2560,51200,0.050613333781560264
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,2560,16384,0.027569777435726587
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,3072,3072,0.008637333081828224
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,2560,8192,0.012096000214417776
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,2560,12288,0.02531822191344367
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,2560,6144,0.010658666491508484
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,2560,10240,0.02216533323129018
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,2560,8192,0.0200284438000785
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,2560,5120,0.009572444690598382
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,2560,7168,0.019138667318556044
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,2560,4096,0.009284444153308868
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,3072,1536,0.006303999986913469
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,2560,3584,0.008725333544943068
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,2560,6144,0.01719555589887831
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,2560,3072,0.00813422186507119
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,2560,5120,0.015170666906568738
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,2560,4096,0.015110222829712762
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,2560,2560,0.006979555719428592
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,2560,2048,0.006628444625271692
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,2560,3072,0.013427555561065674
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,2560,1536,0.005608888963858287
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,2560,2560,0.013464888764752282
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,2560,1024,0.004536889079544279
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,2560,2048,0.013092444174819522
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,2560,768,0.004243555582231945
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,2560,1536,0.012100444071822695
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,2560,512,0.0038613333470291565
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,2560,1024,0.012105777859687805
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,2560,256,0.0032791110376516977
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,2560,768,0.012118221984969245
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,2560,128,0.003168888803985384
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,2560,512,0.01108444482088089
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,2560,64,0.0027022223091787765
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,2560,256,0.011723555624485016
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,2560,32,0.00281866660548581
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,2560,128,0.011690666278203329
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,2560,64,0.010400888820489248
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,2048,65536,0.05105955402056376
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,2560,32,0.010008888940016428
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,2048,51200,0.03828888800409105
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,2560,7168,0.011379555695586734
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,2048,16384,0.015479111009173922
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,2048,65536,0.05952711237801445
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,2048,51200,0.04902133345603943
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,2048,16384,0.0259253333012263
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,2048,10240,0.011685333318180509
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,2048,12288,0.024331554770469666
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,2560,3584,0.013832888669437833
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,2048,7168,0.010808889236715106
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,2048,8192,0.019211555520693462
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,2048,6144,0.009716444545321995
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,2048,7168,0.017497777938842773
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,2048,5120,0.008996444443861643
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,2048,6144,0.015860444969601102
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,2048,4096,0.010788444843557147
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,2048,5120,0.014793778459231058
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,2048,3584,0.009359999663299983
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,2048,4096,0.014085332552591959
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,2048,3072,0.006568888823191325
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,2048,3584,0.013786666923099093
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,2048,2560,0.006593777901596493
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,2048,3072,0.013364444176355997
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,2048,2048,0.0069724445541699724
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,2048,12288,0.01295111080010732
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,2048,2560,0.01312622262371911
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,2048,1536,0.005597333527273602
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,2048,2048,0.012438221938080259
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,2048,1024,0.004561777744028303
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,2048,768,0.003932444585694207
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,2048,8192,0.011346666349305047
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,2048,1536,0.012056888805495368
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,2048,512,0.003519111209445529
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,2048,1024,0.011709333293967776
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,2048,256,0.003167111012670729
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,2048,10240,0.02075111038155026
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,2048,768,0.012100444071822695
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,2048,64,0.0028080000645584534
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,2048,512,0.011039111349317761
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,2048,32,0.0028604444944196274
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,2048,256,0.010692444112565784
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,2048,128,0.011257777611414591
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,1536,65536,0.035804443889194064
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,2048,64,0.011042666931947073
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,1536,51200,0.028714666763941448
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,1536,16384,0.013216888739003075
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,1536,65536,0.05744622151056925
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,1536,51200,0.047453333934148155
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,1536,16384,0.024344000551435683
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,1536,10240,0.010404444403118556
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,1536,8192,0.01016533292002148
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,1536,12288,0.02162222233083513
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,1536,7168,0.009670221971140968
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,1536,10240,0.019507555498017203
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,1536,8192,0.016493333710564505
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,1536,7168,0.015928000211715698
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,1536,5120,0.007781333393520779
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,1536,6144,0.015138667490747241
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,1536,4096,0.007316444483068254
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,1536,5120,0.014444443914625378
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,1536,3584,0.006924444602595435
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,1536,4096,0.014059555199411182
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,1536,3072,0.006309333360857434
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,1536,3584,0.01353422221210268
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,1536,2560,0.005669333454635408
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,1536,3072,0.01346933344999949
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,1536,2048,0.005939555664857228
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,1536,2560,0.01275288893116845
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,1536,1536,0.005184000151024925
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,1536,2048,0.0124195557501581
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,1536,12288,0.011337777806652917
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,1536,1024,0.004201777693298128
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,1536,768,0.0038844446341196695
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,1536,1536,0.012058667010731168
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,1536,512,0.003516444315512975
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,1536,1024,0.01205244412024816
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,1536,768,0.011740444435013665
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,1536,256,0.0028719999310043124
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,1536,6144,0.009015999734401703
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,1536,512,0.011035555766688453
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,1536,128,0.0028444443725877335
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,1536,64,0.002550222186578645
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,1536,256,0.01124533348613315
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,1536,32,0.002842666581273079
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,1536,128,0.011045333411958484
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,1536,64,0.010672888822025724
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,1024,65536,0.025799110531806946
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,1024,51200,0.021185777253574792
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,1536,32,0.009438222481144799
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,1024,16384,0.015253333581818474
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,1024,65536,0.05500533183415731
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,1024,12288,0.012103111379676394
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,2048,128,0.0028168888141711554
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,1024,16384,0.023019555542204116
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,1024,10240,0.011358222199810876
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,1024,8192,0.010566222170988718
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,1024,12288,0.01940799918439653
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,1024,7168,0.009692444569534725
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,1024,10240,0.018147556318177115
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,2048,32,0.009645333720578088
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,1024,6144,0.008470222353935242
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,1024,8192,0.016527111331621807
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,1024,5120,0.008222222328186035
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,1024,4096,0.007324444750944774
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,1024,7168,0.015835555063353646
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,1024,3584,0.006798222247097228
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,1024,6144,0.015095111396577625
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,1024,3072,0.006271111054552927
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,1024,5120,0.01479644411140018
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,1024,4096,0.013821333646774292
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,1024,2560,0.0058986664646201665
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,1024,2048,0.006284444282452266
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,1024,3584,0.013403555585278405
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,1024,3072,0.01311822235584259
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,1024,1536,0.005264889034960005
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,1024,1024,0.004537777768241035
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,1024,2560,0.012736000120639801
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,1024,2048,0.012744888663291931
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,1024,1536,0.011778666741318174
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,1024,1024,0.01178311142656538
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,1024,512,0.003842666745185852
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,1024,256,0.0031395554542541504
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,1024,768,0.012097777591811286
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,1024,128,0.002883555574549569
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,1024,512,0.010911111202504901
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,1024,64,0.0028124445428450904
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,1024,256,0.011028444601429833
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,1024,32,0.0028657778683635923
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,1024,128,0.01110400011142095
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,768,65536,0.021430222524536982
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,1024,64,0.01072533345884747
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,1024,32,0.009359111388524374
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,768,51200,0.017877333694034152
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,768,16384,0.010370666782061258
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,768,12288,0.01038044442733129
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,768,65536,0.05359199974271986
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,768,10240,0.009710222482681274
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,768,51200,0.04377422067854139
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,768,16384,0.02131555477778117
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,768,8192,0.009202666580677032
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,768,12288,0.018696889281272888
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,768,10240,0.017854221993022494
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,768,6144,0.007999999655617608
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,768,8192,0.016516443755891588
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,768,5120,0.0069306666652361555
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,768,7168,0.01551466683546702
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,768,4096,0.007287999822033777
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,768,6144,0.015487111277050443
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,1024,768,0.0041955556306574075
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,768,3584,0.007274666594134436
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,768,5120,0.014534221755133735
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,768,3072,0.006635555376609166
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,768,4096,0.013464888764752282
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,768,2560,0.006590222318967183
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,768,2048,0.004927999857399198
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,768,3584,0.013154666456911298
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,768,3072,0.013447110851605734
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,768,1536,0.004873777843183941
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,768,2560,0.01273155543539259
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,768,1024,0.004184000194072723
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,768,768,0.0038657776183552216
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,768,2048,0.012758221891191272
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,768,512,0.00351555562681622
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,768,1536,0.012424888710180918
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,1024,51200,0.04532444477081299
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,768,256,0.0032106666929192017
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,768,128,0.0028524444335036804
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,768,768,0.011706666813956367
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,768,64,0.0028320000403457214
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,768,512,0.011418666276666852
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,768,32,0.0028293333533737394
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,768,256,0.010687111152542962
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,768,128,0.011563555234008364
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,512,65536,0.016943999462657504
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,768,64,0.01000533335738712
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,512,51200,0.014497778481907315
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,768,32,0.009671111073758867
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,512,16384,0.010829333629873065
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,512,65536,0.05302400059170193
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,768,7168,0.008974221845467886
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,512,12288,0.00872444444232517
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,512,10240,0.007627555893527136
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,512,16384,0.02129688858985901
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,512,8192,0.008010666403505538
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,512,12288,0.01851377718978458
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,512,7168,0.007993777592976889
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,512,10240,0.017877333694034152
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,512,6144,0.007299555672539606
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,512,8192,0.01649777756796943
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,512,5120,0.006974221931563483
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,512,7168,0.01551466683546702
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,512,4096,0.007304888632562425
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,512,6144,0.015454222758611044
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,512,3584,0.007269333634111617
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,512,5120,0.014663999279340109
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,512,4096,0.013601777454217276
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,512,3584,0.013444444371594323
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,512,2560,0.006618666566080517
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,768,1024,0.01146399974822998
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,512,3072,0.0127697777416971
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,512,2560,0.012778666284349231
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,512,1536,0.004584889031118817
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,512,2048,0.012078222301271228
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,512,1024,0.0038444445365005066
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,512,1536,0.012436444560686747
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,512,768,0.003528000166018804
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,512,1024,0.011352000137170156
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,512,51200,0.0435804459783766
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,512,512,0.0031395554542541504
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,512,256,0.00286666676402092
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,512,768,0.012100444071822695
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,512,512,0.0107004443804423
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,512,128,0.0030577776746617425
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,512,64,0.002862222285734283
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,512,256,0.01090222183201048
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,512,32,0.002521777732504739
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,512,128,0.010684444672531553
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,512,64,0.010693333215183683
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,512,32,0.009317333499590555
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,256,51200,0.013215999636385175
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,512,3072,0.00692622239391009
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,256,65536,0.050251556767357715
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,256,16384,0.009024889104896123
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,256,12288,0.008374222450786168
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,256,51200,0.04075555668936835
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,512,2048,0.005912888795137405
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,256,16384,0.021292444732454088
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,256,8192,0.007130666739410824
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,256,12288,0.01889955500761668
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,256,7168,0.006730666591061487
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,256,6144,0.006590222318967183
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,256,10240,0.017287110288937885
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,256,5120,0.00590133335855272
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,256,8192,0.015917332635985482
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,256,7168,0.015984000431166757
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,256,4096,0.005643555687533484
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,256,3584,0.00590844452381134
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,256,5120,0.01440177857875824
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,256,3072,0.005976000179847081
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,256,4096,0.014084445105658637
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,256,2560,0.006294222341643439
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,256,3584,0.013410666750537025
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,256,2048,0.0059057776298787855
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,256,3072,0.013239999612172445
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,256,1536,0.00452888881166776
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,256,2560,0.013080000049538083
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,256,1024,0.003571555432346132
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,256,2048,0.011725333001878528
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,256,768,0.0035137778355015647
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,256,65536,0.014932443698247274
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,256,1536,0.011721777419249216
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,256,512,0.0032097777972618737
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,256,256,0.0028844444702068963
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,256,768,0.011415111521879831
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,256,512,0.010748444332016839
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,256,128,0.0028133332315418455
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,256,64,0.002485333424475458
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,256,256,0.011036444041464063
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,256,32,0.002776888923512565
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,256,10240,0.007311111523045435
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,256,128,0.011036444041464063
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,256,64,0.010675555302037133
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,128,65536,0.014175999495718213
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,256,32,0.009152889251708984
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,128,16384,0.00795111142926746
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,128,65536,0.04869955446985033
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,128,51200,0.040067556831571795
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,128,12288,0.007145778172545963
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,128,10240,0.006974221931563483
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,128,16384,0.0207022229830424
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,256,6144,0.015489778584904142
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,128,8192,0.006608888920810487
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,128,12288,0.018238221605618794
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,128,10240,0.017172444197866652
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,128,6144,0.00629066675901413
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,128,8192,0.01627111103799608
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,128,7168,0.015495111544926962
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,128,5120,0.005590222362014983
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,128,6144,0.014550222290886773
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,128,4096,0.005602666487296422
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,256,1024,0.01204622205760744
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,128,3584,0.006245333287451003
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,128,4096,0.013408000270525614
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,128,3072,0.005541333307822545
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,128,3584,0.013423999978436364
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,128,2560,0.006301333506902059
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,128,51200,0.012448000411192576
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,128,2048,0.005573333137565189
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,128,2560,0.01275111072593265
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,128,1536,0.004559999952713649
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,128,2048,0.011721777419249216
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,128,1024,0.0038480001191298165
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,128,1536,0.012392000191741519
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,128,7168,0.006274666637182236
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,128,768,0.003544888976547453
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,128,512,0.003208000005947219
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,128,1024,0.011378666592968835
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,128,256,0.0028782222006056043
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,128,768,0.011396444506115384
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,128,128,0.0026062221990691293
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,128,512,0.011064888702498542
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,128,64,0.002483555633160803
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,128,256,0.010743111371994019
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,128,32,0.002826666666401757
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,128,128,0.010633777413103314
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,128,64,0.010413332945770687
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,128,5120,0.014122666584120857
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,64,51200,0.009644444617960189
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,128,32,0.010287111004193624
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,64,16384,0.006628444625271692
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,64,65536,0.04892355534765455
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,64,12288,0.006578666468461354
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,64,51200,0.04009688893953959
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,64,16384,0.020623111062579684
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,128,3072,0.013086222112178802
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,64,12288,0.018529777725537617
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,64,8192,0.006248000181383557
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,64,10240,0.01719288859102461
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,64,8192,0.016153777639071148
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,64,6144,0.006468444648716185
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,64,7168,0.015280000037617154
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,64,5120,0.005617777920431561
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,64,6144,0.015119110544522604
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,64,4096,0.0058871110280354815
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,64,5120,0.014139556222491793
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,64,3584,0.005897777775923411
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,64,4096,0.013821333646774292
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,64,3072,0.005917333480384614
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,64,3584,0.013184888495339287
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,64,65536,0.010676444404655032
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,64,2560,0.005883555445406172
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,64,2048,0.00556355549229516
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,64,3072,0.013148444394270578
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,64,1536,0.004243555582231945
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,64,2560,0.012392889294359418
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,64,1024,0.00351200004418691
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,64,2048,0.011720889144473605
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,64,768,0.003506666670242945
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,64,1536,0.012444444828563266
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,64,10240,0.005882666756709416
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,64,512,0.0031795555518733132
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,64,1024,0.011331555744012197
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,64,256,0.00282222218811512
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,64,128,0.002495999965402815
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,64,64,0.002485333424475458
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,64,512,0.010446222292052375
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,64,7168,0.00591111100382275
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,64,32,0.002526222210791376
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,64,256,0.011346666349305047
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,64,128,0.011381333072980246
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,32,65536,0.009299555586444007
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,64,64,0.00965244405799442
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,32,51200,0.008361777497662438
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,64,32,0.009937778115272522
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,32,16384,0.006253333141406377
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,32,12288,0.006236444330877728
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,32,65536,0.04861688945028517
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,32,10240,0.006224888894293044
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,32,8192,0.005565333283609814
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,32,16384,0.02091644373204973
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,32,12288,0.018198221921920776
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,32,7168,0.005946666830115848
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,32,10240,0.017216889394654166
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,32,8192,0.015814221567577787
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,32,5120,0.005229333208666907
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,32,7168,0.015474667151769003
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,32,6144,0.014840889308187695
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,32,5120,0.01408266690042284
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,32,3584,0.00556355549229516
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,32,4096,0.013759999639458127
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,32,3072,0.00589155571328269
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,32,3584,0.013083555632167392
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,32,2560,0.005625777774386936
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,32,3072,0.01310400002532535
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,32,2048,0.005881777654091517
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,64,768,0.011534222298198275
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,32,2560,0.012436444560686747
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,32,1536,0.004520888957712385
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,32,2048,0.012702222499582501
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,32,1024,0.0038693332009845306
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,32,1536,0.011698666546079846
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,32,768,0.0035084444615576
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,32,51200,0.04003999961747064
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,32,1024,0.012051555845472546
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,32,512,0.0031386667655573953
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,32,256,0.002509333400262727
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,32,768,0.011067555182509951
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,32,6144,0.005976000179847081
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,32,128,0.00281866660548581
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,32,64,0.002487999904486868
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,32,256,0.011003555523024665
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,32,32,0.0024951110697454875
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,6,32,4096,0.005225777626037598
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,32,64,0.010383110907342698
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,32,32,0.009004444711738164
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,65536,16384,0.3379831049177382
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,65536,51200,0.49477513631184894
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,65536,16384,0.2258115609486898
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,65536,12288,0.26012444496154785
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,65536,51200,1.0132542716132271
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,32,512,0.011704000333944956
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,6,32,128,0.011425777441925473
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,65536,12288,0.16002133157518175
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,65536,10240,0.21875377496083578
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,65536,8192,0.16819466484917533
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,65536,7168,0.14642400211758083
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,65536,6144,0.11431111229790582
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,65536,8192,0.12314755386776394
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,65536,10240,0.13550578223334417
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,65536,7168,0.11041511429680718
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,65536,5120,0.09699466493394639
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,65536,6144,0.09489778015348647
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,65536,4096,0.08023022280799018
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,65536,3584,0.0689635541703966
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,65536,3072,0.060759113894568555
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,65536,5120,0.08283378018273248
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,65536,4096,0.06964800092909071
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,65536,3584,0.062485330634646945
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,65536,2048,0.04239822096294827
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,65536,1536,0.032630221711264715
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,65536,1024,0.02351644469632043
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,65536,3072,0.05885599719153511
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,65536,2048,0.04301333427429199
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,65536,1536,0.03397866752412584
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,65536,1024,0.026727111803160772
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,65536,512,0.013518222504191928
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,65536,256,0.008646222452322641
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,65536,768,0.0232595553000768
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,65536,128,0.0064382221963670515
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,65536,512,0.019558222757445443
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,65536,256,0.01552088889810774
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,65536,64,0.005577777822812398
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,65536,32,0.005592888842026393
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,65536,128,0.013781333135233985
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,65536,64,0.014839111102951897
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,65536,32,0.01442488862408532
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,65536,2560,0.05048977666431003
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,65536,2560,0.04540977875391642
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,51200,65536,0.5221164491441515
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,65536,768,0.018900444110234577
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,51200,51200,0.7461511294047037
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,51200,65536,0.9662959840562609
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,51200,16384,0.25033511055840385
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,51200,12288,0.1921395593219333
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,51200,16384,0.17356533474392363
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,51200,51200,0.39742310841878253
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,51200,10240,0.16087822119394937
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,51200,8192,0.13253066274854872
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,51200,7168,0.11636711491478814
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,51200,8192,0.10226844416724311
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,51200,10240,0.10982844564649795
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,51200,12288,0.12776711252000597
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,51200,6144,0.10514310995737712
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,51200,5120,0.08978044324451023
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,51200,5120,0.06860622432496813
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,51200,4096,0.07103821966383192
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,51200,7168,0.08860444360309178
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,51200,3584,0.06417244672775269
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,51200,3072,0.054563555452558726
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,51200,2560,0.046613332298066884
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,51200,3584,0.05201155609554715
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,51200,4096,0.05918400155173408
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,51200,6144,0.08079822195900811
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,51200,1536,0.0296106669637892
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,51200,2048,0.0378479990694258
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,51200,2560,0.03855822152561612
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,51200,1024,0.02118844456142849
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,51200,768,0.015504888362354703
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,51200,2048,0.037236445479922824
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,51200,512,0.011115555961926779
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,51200,1536,0.03100088900989956
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,51200,1024,0.023511999183230933
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,51200,256,0.007338666253619724
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,51200,128,0.004120888809363048
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,51200,768,0.021778666310840186
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,51200,512,0.01754399968518151
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,51200,64,0.0031866667171319327
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,51200,32,0.0034924443397257063
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,51200,64,0.014143110977278816
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,51200,128,0.013091555900043912
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,16384,65536,0.3215413358476427
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,16384,65536,0.1846515602535672
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,16384,16384,0.08691910902659099
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,51200,3072,0.05028888914320204
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,16384,51200,0.13892711533440485
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,16384,51200,0.2487502098083496
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,16384,12288,0.0662284427218967
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,16384,16384,0.07884533537758721
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,16384,8192,0.04316355453597175
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,16384,12288,0.05634399917390612
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,16384,10240,0.0487333337465922
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,16384,7168,0.03737422161632114
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,16384,6144,0.03277777632077535
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,16384,8192,0.04933955603175693
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,16384,7168,0.039020445611741804
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,51200,32,0.013711999687883588
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,16384,6144,0.03580977850490146
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,16384,4096,0.022994667291641235
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,16384,3584,0.02054933375782437
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,16384,4096,0.027277333868874445
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,16384,3584,0.025401777691311304
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,16384,3072,0.018248000078731112
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,16384,2560,0.015638222297032673
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,16384,3072,0.024549333585633173
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,16384,2560,0.020808888806237113
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,16384,2048,0.01331999980741077
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,16384,1536,0.010820444259378644
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,16384,10240,0.055543998877207436
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,16384,2048,0.020569778150982328
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,16384,1024,0.008339555727110969
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,16384,1536,0.018238221605618794
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,16384,768,0.006923555499977536
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,16384,512,0.005260444349712796
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,16384,1024,0.01532977819442749
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,16384,256,0.0034293333689371743
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,16384,768,0.014838222000333997
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,16384,128,0.002846222163902389
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,16384,5120,0.02780888809098138
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,16384,64,0.002842666581273079
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,16384,256,0.011352889239788055
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,16384,512,0.013807111316257052
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,16384,32,0.0028284444577164124
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,16384,128,0.012067555553383298
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,16384,5120,0.031565331750445895
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,16384,64,0.011764444410800934
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,16384,32,0.010704889065689512
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,12288,51200,0.18878489070468477
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,12288,16384,0.06606222523583306
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,12288,65536,0.24473333358764648
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,12288,65536,0.1547973288430108
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,12288,51200,0.1208240058686998
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,12288,12288,0.051318221622043185
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,12288,10240,0.04401510953903198
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,12288,8192,0.03682133224275377
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,12288,16384,0.06079644627041287
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,12288,12288,0.05014488763279385
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,12288,10240,0.045034666856129967
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,12288,7168,0.03228888909022013
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,12288,6144,0.02865511178970337
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,12288,8192,0.04058400127622817
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,12288,5120,0.025052444802390203
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,12288,4096,0.022090666823916968
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,12288,7168,0.03520800007714166
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,12288,6144,0.03520888752407498
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,12288,5120,0.02872177627351549
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,12288,3072,0.017432888348897297
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,12288,4096,0.025822222232818604
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,12288,3584,0.02365422248840332
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,51200,256,0.014170666535695394
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,12288,2560,0.02016177773475647
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,12288,1536,0.008620444271299574
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,12288,1024,0.007276444799370236
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,12288,2048,0.01927911076280806
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,12288,768,0.0059279998143513995
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,12288,1536,0.017849778135617573
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,12288,512,0.003560888684458203
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,12288,1024,0.014456000592973499
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,12288,256,0.00315022220214208
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,12288,768,0.014113777213626437
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,12288,128,0.0028764444092909494
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,12288,512,0.013420444395807056
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,12288,64,0.002534222271707323
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,12288,256,0.011408888631396823
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,12288,32,0.0028195555011431375
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,12288,128,0.011429333024554782
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,12288,64,0.011379555695586734
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,12288,32,0.011026666396194033
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,10240,65536,0.20536711480882433
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,12288,3584,0.019357333580652874
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,10240,51200,0.16187911563449436
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,10240,65536,0.1466319958368937
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,10240,16384,0.05827733543184069
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,10240,12288,0.04389422138532003
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,10240,51200,0.11567821767595078
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,10240,10240,0.03803999887572394
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,12288,3072,0.022859555151727464
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,10240,16384,0.05455644594298469
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,10240,12288,0.04520000020662943
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,10240,8192,0.03131555517514547
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,10240,7168,0.02870133188035753
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,10240,10240,0.04159288936191135
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,10240,8192,0.034338666333092585
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,10240,6144,0.02544266647762722
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,10240,5120,0.022286223040686712
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,10240,7168,0.03132088979085287
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,10240,4096,0.019259555472267997
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,10240,6144,0.028093334701326158
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,10240,3584,0.01750577820671929
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,10240,5120,0.024898666474554274
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,10240,3072,0.01553066737122006
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,10240,2560,0.01442577772670322
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,10240,4096,0.023016888234350417
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,10240,3584,0.02130577796035343
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,10240,2048,0.010201777848932479
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,10240,3072,0.020100444555282593
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,10240,1536,0.008850666383902231
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,10240,1024,0.006575999988449945
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,10240,2048,0.01752355529202355
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,10240,1536,0.015784000356992085
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,10240,1024,0.014264000786675347
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,10240,768,0.00463733325401942
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,10240,512,0.0035013332962989807
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,10240,256,0.0031600000543726813
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,10240,768,0.013796444568369122
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,10240,512,0.012395555774370829
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,12288,2560,0.015252444479200574
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,10240,256,0.011790222591824003
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,10240,64,0.0028488888508743713
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,10240,32,0.002874666617976295
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,12288,2048,0.013420444395807056
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,10240,128,0.011391999820868174
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,10240,64,0.011039111349317761
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,10240,32,0.010079111489984725
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,8192,65536,0.1718133290608724
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,8192,51200,0.12882578372955322
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,8192,16384,0.0449022220240699
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,8192,65536,0.09758222103118896
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,8192,12288,0.033033778270085655
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,8192,10240,0.027684445182482403
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,8192,51200,0.07760889000362821
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,8192,8192,0.023527999718983967
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,8192,16384,0.04711911082267761
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,8192,12288,0.03546222382121616
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,8192,7168,0.020495999190542433
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,8192,6144,0.0181057784292433
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,8192,10240,0.03256977929009332
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,8192,8192,0.027752000424597
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,8192,5120,0.01571999986966451
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,8192,4096,0.013787555197874704
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,8192,7168,0.02608977754910787
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,8192,3584,0.011832888755533429
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,8192,6144,0.022967999180157978
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,8192,3072,0.011052444577217102
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,10240,2560,0.01824355622132619
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,8192,5120,0.02126666737927331
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,8192,4096,0.019488000207477145
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,8192,2048,0.00831200016869439
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,8192,3584,0.019130667050679524
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,8192,3072,0.017858665850427415
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,8192,1536,0.007144889069928064
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,8192,2560,0.01683022247420417
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,8192,2048,0.015451555450757345
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,8192,768,0.0038613333470291565
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,8192,512,0.0035013332962989807
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,8192,1536,0.014487110906177096
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,8192,1024,0.013457777599493662
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,10240,128,0.0028497777465316984
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,8192,768,0.012438221938080259
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,8192,128,0.00282222218811512
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,8192,512,0.011727111207114326
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,8192,64,0.0028168888141711554
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,8192,256,0.011724444727102915
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,8192,32,0.002826666666401757
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,8192,128,0.010662222074137794
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,8192,64,0.011023999916182624
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,8192,32,0.010335110955768162
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,7168,65536,0.1482951111263699
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,7168,51200,0.11693333254920112
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,7168,65536,0.09133155478371514
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,7168,16384,0.04110577702522278
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,7168,12288,0.03288177649180094
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,7168,51200,0.0713697804345025
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,7168,10240,0.028129776318868
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,7168,16384,0.04186222288343641
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,7168,12288,0.03461066550678677
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,7168,8192,0.024130667249361675
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,7168,7168,0.018665777312384713
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,7168,10240,0.030841777722040813
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,7168,6144,0.016407110624843173
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,7168,8192,0.026755554808510676
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,7168,5120,0.014412444498803882
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,8192,2560,0.009654222263230218
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,7168,7168,0.024711999628278945
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,7168,4096,0.01275466630856196
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,7168,3584,0.011215111447705163
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,7168,6144,0.02330400049686432
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,7168,3072,0.01018311083316803
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,7168,5120,0.020979555116759405
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,8192,1024,0.005214222189452913
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,7168,4096,0.018783999813927543
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,7168,3584,0.018230222993426852
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,7168,2048,0.00796888851457172
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,7168,1536,0.006584888945023219
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,7168,3072,0.01721155477894677
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,8192,256,0.002995555599530538
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,7168,2560,0.015973332855436537
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,7168,1024,0.004868444469239977
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,7168,768,0.003726222034957674
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,7168,512,0.003208000005947219
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,7168,1536,0.013778666655222574
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,7168,1024,0.013096888860066732
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,7168,256,0.003177777760558658
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,7168,768,0.012300444145997366
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,7168,128,0.00281866660548581
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,7168,64,0.0028595555987623003
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,7168,256,0.011741333537631564
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,7168,128,0.0107360002067354
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,7168,32,0.0028568889117903183
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,7168,64,0.010799110763602786
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,6144,65536,0.12270132700602214
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,6144,65536,0.08305866850747003
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,6144,51200,0.09661244683795506
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,6144,16384,0.03547999925083584
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,6144,51200,0.06521155436833699
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,6144,12288,0.02831288841035631
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,6144,16384,0.04211466511090597
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,6144,10240,0.02438755498992072
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,7168,2560,0.008932444784376357
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,6144,8192,0.02126311096880171
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,6144,12288,0.033193777004877724
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,6144,7168,0.019109333554903667
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,6144,10240,0.02777066661251916
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,7168,2048,0.015481778317027621
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,6144,6144,0.017091555727852713
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,6144,8192,0.02576622201336755
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,6144,5120,0.01517955627706316
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,6144,4096,0.011644444531864591
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,6144,7168,0.0236453331179089
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,6144,6144,0.02165688905451033
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,7168,512,0.011702222128709158
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,6144,3584,0.010283555421564314
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,6144,3072,0.009296889106432596
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,6144,5120,0.020015999674797058
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,6144,2560,0.008379555410808986
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,6144,4096,0.018770666586028207
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,6144,2048,0.00740622232357661
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,6144,3584,0.01789688898457421
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,6144,1536,0.006211555666393704
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,6144,1024,0.004302222281694412
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,6144,2560,0.015278221832381355
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,6144,768,0.0038568890757030914
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,7168,32,0.010019555687904358
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,6144,2048,0.014858666393491956
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,6144,512,0.0033191111352708605
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,6144,1536,0.013452444639470843
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,6144,256,0.002879111096262932
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,6144,1024,0.012099555797047086
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,6144,128,0.00282222218811512
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,6144,64,0.0028373334142896864
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,6144,512,0.012409778104888068
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,6144,32,0.0028400001012616684
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,6144,256,0.011383111278216044
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,6144,128,0.010658666491508484
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,6144,64,0.010049777726332346
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,5120,65536,0.1058737768067254
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,6144,32,0.01037688884470198
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,5120,51200,0.08456889126035903
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,5120,16384,0.031567109955681696
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,5120,65536,0.0756124456723531
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,5120,12288,0.02567911148071289
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,5120,10240,0.021870222356584337
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,5120,51200,0.05967999829186333
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,5120,16384,0.03668355610635545
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,5120,8192,0.019376888871192932
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,5120,12288,0.03012266755104065
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,5120,7168,0.017126222451527912
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,5120,10240,0.02606311109330919
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,5120,6144,0.015480889214409722
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,5120,5120,0.01384800010257297
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,5120,8192,0.024675556355052527
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,5120,7168,0.023123555713229712
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,5120,4096,0.011008888483047485
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,5120,3584,0.009462222456932068
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,5120,6144,0.022336888644430373
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,5120,3072,0.008555555509196388
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,5120,4096,0.01833866702185737
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,6144,3072,0.017329777280489605
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,5120,2560,0.007978666987684038
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,5120,3584,0.017811555001470778
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,5120,2048,0.0069671107663048645
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,5120,3072,0.016501333978441026
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,5120,1536,0.005184000151024925
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,5120,1024,0.0038764443662431505
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,5120,2560,0.01444533301724328
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,5120,2048,0.013766222529941134
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,5120,768,0.0035048888789282907
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,6144,768,0.012450666891203986
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,5120,1024,0.0120666664507654
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,5120,512,0.003156444471743372
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,5120,256,0.0031679999083280563
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,5120,768,0.012119111087587146
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,5120,128,0.0028204443968004654
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,5120,512,0.011642666326628791
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,5120,64,0.002526222210791376
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,5120,128,0.010748444332016839
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,5120,32,0.0024906665914588505
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,5120,64,0.010041777458455827
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,5120,32,0.009686222506894005
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,4096,65536,0.09025066428714329
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,4096,51200,0.06679555442598131
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,4096,65536,0.06945600112279256
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,5120,5120,0.019179556104871962
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,4096,51200,0.055383112695482045
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,4096,12288,0.020569778150982328
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,4096,16384,0.034958223501841225
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,4096,10240,0.018437332577175565
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,4096,12288,0.028016000986099243
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,5120,1536,0.013758222262064615
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,4096,8192,0.015821332732836407
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,4096,7168,0.014459555347760519
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,4096,10240,0.024450666374630396
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,4096,6144,0.013407111167907715
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,4096,8192,0.022679999470710754
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,4096,7168,0.022171555293930903
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,4096,5120,0.011981333295504252
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,5120,256,0.011025778121418424
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,4096,4096,0.010695999695195092
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,4096,6144,0.01925511161486308
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,4096,3584,0.011316444310877057
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,4096,3072,0.010326222413116032
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,4096,5120,0.018783999813927543
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,4096,4096,0.017519111434618633
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,4096,2560,0.009343999955389235
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,4096,3584,0.015508444772826301
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,4096,2048,0.007874666816658443
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,4096,3072,0.015106666419241162
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,4096,2560,0.014382221632533602
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,4096,2048,0.013970666461520724
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,4096,1024,0.005055111315515307
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,4096,768,0.00423555572827657
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,4096,1536,0.013167111410035027
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,4096,512,0.003834666477309333
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,4096,16384,0.02630133264594608
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,4096,256,0.0028400001012616684
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,4096,768,0.012112889024946423
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,4096,128,0.002847111059559716
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,4096,512,0.011394666300879585
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,4096,64,0.0025128889828920364
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,4096,256,0.010727110836240979
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,4096,32,0.0028400001012616684
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,4096,128,0.01108444482088089
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,4096,64,0.009975999593734741
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,3584,65536,0.0791226691669888
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,4096,32,0.009391999906963771
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,3584,51200,0.061011552810668945
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,3584,65536,0.06587911314434476
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,3584,16384,0.0239991115199195
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,3584,12288,0.01903022163444095
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,3584,51200,0.05331110954284668
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,3584,10240,0.016591999265882704
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,3584,16384,0.031162665949927434
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,3584,8192,0.014615111880832247
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,3584,12288,0.027464000715149775
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,3584,10240,0.023944889505704243
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,4096,1536,0.005912888795137405
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,3584,6144,0.012427555190192329
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,3584,7168,0.020503110355801053
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,3584,5120,0.011312888728247749
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,3584,6144,0.021232888102531433
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,4096,1024,0.012430222498046027
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,3584,4096,0.010040000081062317
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,3584,3584,0.011042666931947073
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,3584,5120,0.01716444392999013
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,3584,3072,0.009646221995353699
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,3584,4096,0.015917332635985482
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,3584,2560,0.008674666285514832
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,3584,3584,0.015586665934986539
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,3584,2048,0.006592000110281839
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,3584,1536,0.005930666708283954
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,3584,3072,0.014490667316648694
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,3584,2560,0.01391377713945177
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,3584,1024,0.004587555511130227
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,3584,768,0.0041964443193541635
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,3584,2048,0.014139556222491793
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,3584,512,0.0038888889054457345
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,3584,1024,0.012375999655988483
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,3584,768,0.012078222301271228
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,3584,512,0.012347555822796293
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,3584,128,0.0028400001012616684
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,3584,256,0.01069155583779017
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,3584,64,0.00282222218811512
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,3584,128,0.011400000088744693
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,3584,32,0.0028604444944196274
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,3584,8192,0.02164711058139801
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,3584,64,0.010407999985747868
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,3584,32,0.01035822182893753
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,3072,65536,0.06280355321036445
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,3072,51200,0.050584889120525785
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,3072,65536,0.06423999865849812
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,3072,16384,0.020579554968410067
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,3072,51200,0.051698668135537036
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,3072,16384,0.030076444149017334
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,3072,12288,0.017214222086800467
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,3072,10240,0.014961777461899651
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,3072,12288,0.025789333714379206
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,3584,1536,0.012784889174832238
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,3072,8192,0.01312711089849472
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,3072,7168,0.0123831108212471
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,3072,10240,0.02330133318901062
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,3584,256,0.002809777855873108
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,3072,6144,0.011398221883508893
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,3072,8192,0.02102577851878272
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,3072,5120,0.010605333579911126
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,3072,4096,0.009685333404276106
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,3072,7168,0.019838222199016146
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,3072,6144,0.017900443739361234
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,3072,3584,0.009078222016493479
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,3072,3072,0.008632889224423302
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,3072,5120,0.01660711069901784
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,3072,4096,0.015776000089115567
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,3584,7168,0.013390222357379066
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,3072,3584,0.014127999544143677
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,3072,2048,0.006577777779764599
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,3072,3072,0.014111111561457316
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,3072,1536,0.006234666539563074
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,3072,1024,0.004864000197913912
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,3072,2560,0.013472889032628802
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,3072,768,0.004567999806669024
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,3072,2048,0.013363555901580386
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,3072,1536,0.012736000120639801
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,3072,1024,0.011950222154458364
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,3072,256,0.003169777699642711
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,3072,768,0.011691555380821228
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,3072,128,0.0032151111712058387
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,3072,512,0.010800888968838586
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,3072,64,0.00254488881263468
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,3072,256,0.010695999695195092
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,3072,32,0.002487999904486868
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,3072,128,0.010675555302037133
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,3072,64,0.01036088913679123
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,2560,65536,0.056939555539025195
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,3072,32,0.0103493332862854
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,2560,51200,0.04432000054253472
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,2560,16384,0.018961777289708454
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,2560,65536,0.06155733267466227
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,2560,12288,0.015496888094478183
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,2560,51200,0.04989155464702182
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,2560,10240,0.013782222237851886
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,2560,16384,0.028157333532969158
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,2560,8192,0.012083555261294046
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,2560,12288,0.023992000354660883
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,2560,7168,0.01124533348613315
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,3072,2560,0.007618666523032718
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,2560,10240,0.021648888786633808
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,2560,6144,0.010375111467308467
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,2560,8192,0.019670221540662978
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,2560,5120,0.00999022192425198
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,2560,4096,0.00908799966176351
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,2560,7168,0.01874755488501655
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,2560,6144,0.017338666650984023
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,2560,3584,0.008622222476535374
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,2560,3072,0.00793599999613232
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,2560,5120,0.015499555402331881
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,3072,512,0.003850666599141227
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,2560,2560,0.006636444479227066
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,2560,4096,0.014955555399258932
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,2560,2048,0.005944889038801193
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,2560,3584,0.014105778601434497
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,2560,1536,0.005542222410440445
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,2560,3072,0.013738666971524557
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,2560,1024,0.004849777867396672
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,2560,2560,0.013442666994200813
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,2560,768,0.004386666748258802
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,2560,2048,0.012445333103338877
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,2560,512,0.003660444584157732
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,2560,1536,0.012488889197508493
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,2560,256,0.0031644445326593188
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,2560,1024,0.011716444459226398
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,2560,128,0.0031537777847713898
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,2560,768,0.012089778151777057
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,2560,64,0.002537777854336633
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,2560,32,0.002801777794957161
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,2560,512,0.011376000112957425
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,2560,128,0.010667555862002902
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,2048,65536,0.05024888780381945
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,2560,64,0.01070755554570092
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,2048,51200,0.038019554482565984
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,2560,32,0.010001777774757808
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,2048,16384,0.015837333268589444
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,2048,12288,0.012898666991127862
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,2048,65536,0.059261335266960986
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,2048,10240,0.011699555648697747
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,2048,51200,0.048730668094423085
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,2048,8192,0.011251555548773872
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,2048,16384,0.026744888888465032
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,2048,7168,0.01071111112833023
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,2048,12288,0.023017777336968318
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,2048,6144,0.009773333039548662
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,2048,10240,0.02121777832508087
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,2048,8192,0.018412444326612685
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,2048,7168,0.01739022301303016
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,2048,4096,0.010168000227875179
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,2048,6144,0.016495111915800307
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,2048,3584,0.009295110901196798
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,2048,5120,0.01480888823668162
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,2048,3072,0.006602666858169768
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,2048,4096,0.014537778165605334
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,2048,2560,0.0058711109062035876
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,2048,3584,0.013872000078360239
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,2048,2048,0.006635555376609166
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,2048,3072,0.01344622257683012
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,2048,1536,0.005659555395444234
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,2048,2560,0.013164444102181328
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,2048,1024,0.00519466648499171
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,2048,2048,0.012522666818565793
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,2048,768,0.0041680000722408295
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,2048,1536,0.012478222449620565
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,2048,512,0.0035297779573334586
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,2048,1024,0.011393778026103973
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,2048,256,0.0031973332580592898
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,2560,256,0.011046222514576383
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,2048,128,0.0028657778683635923
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,2048,512,0.011766222616036734
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,2048,64,0.0025191110455327565
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,2048,256,0.011003555523024665
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,2048,32,0.0028702221396896574
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,2048,128,0.011428444749779172
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,2048,64,0.011071110765139261
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,1536,65536,0.036377777655919395
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,2048,32,0.009663999908500248
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,1536,51200,0.02870755394299825
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,2048,5120,0.009014222357008193
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,1536,16384,0.01316088851955202
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,1536,12288,0.01129422254032559
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,1536,65536,0.05708622270160251
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,1536,10240,0.010659555594126383
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,1536,51200,0.046851555506388344
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,1536,8192,0.010205333431561789
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,1536,16384,0.02438933319515652
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,1536,7168,0.009705777797434065
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,1536,12288,0.021141333712471858
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,1536,6144,0.008625778059164682
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,1536,10240,0.018937778141763475
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,1536,5120,0.00795111142926746
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,1536,8192,0.0162435554795795
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,1536,4096,0.007321777443091075
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,1536,7168,0.015799111790127225
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,1536,3584,0.007264888948864407
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,1536,6144,0.015133332875039844
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,1536,3072,0.006291555447710886
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,1536,5120,0.014759999182489185
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,1536,2560,0.00563822231358952
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,1536,4096,0.013896889156765409
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,1536,2048,0.006256000035338932
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,1536,3584,0.013775111072593264
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,1536,1536,0.005054222212897407
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,1536,3072,0.013267555170589022
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,1536,1024,0.004190222256713443
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,1536,2560,0.01311377767059538
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,1536,768,0.003906666818592283
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,1536,512,0.0035004446076022256
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,1536,2048,0.012091555529170565
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,1536,1536,0.012470222181744046
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,1536,256,0.0031840000301599503
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,2048,768,0.012039999994966718
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,1536,768,0.012105777859687805
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,1536,64,0.0028577778074476454
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,1536,512,0.012058667010731168
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,1536,256,0.010919111470381418
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,1536,32,0.00286666676402092
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,1536,128,0.011036444041464063
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,1024,65536,0.02550933261712392
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,1536,64,0.011063111325105032
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,1024,51200,0.02124622298611535
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,1536,32,0.009325332939624786
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,1024,16384,0.014497778481907315
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,1024,12288,0.012412444584899478
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,1024,65536,0.05500177873505486
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,1024,10240,0.01201600001917945
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,1024,51200,0.04435555471314324
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,1024,16384,0.023023999399609033
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,1024,8192,0.010384000009960597
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,1024,12288,0.019167110323905945
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,1024,7168,0.009357333183288574
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,1024,6144,0.009001777403884465
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,1024,10240,0.017747556169827778
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,1024,8192,0.01614488826857673
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,1024,5120,0.007985778152942657
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,1024,7168,0.015824889143308003
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,1024,4096,0.007276444799370236
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,1024,3584,0.0069155556460221606
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,1024,5120,0.014113777213626437
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,1024,3072,0.006573333508438534
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,1024,3584,0.013532444834709167
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,1024,2560,0.005882666756709416
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,1024,3072,0.013139555851618448
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,1024,2560,0.013089777694808112
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,1536,1024,0.011718221836619906
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,1536,128,0.0028106667515304354
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,1024,2048,0.006590222318967183
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,1024,1536,0.005643555687533484
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,1024,1024,0.004863111095296012
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,1024,2048,0.01239999963177575
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,1024,1536,0.012057777908113269
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,1024,768,0.004579555657174853
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,1024,1024,0.011378666592968835
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,1024,512,0.0035573335157500375
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,1024,256,0.0032213332338465583
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,1024,768,0.011715555356608497
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,1024,128,0.003165333428316646
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,1024,512,0.011341333389282227
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,1024,64,0.002805333377586471
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,1024,256,0.010848888920413123
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,1024,32,0.0027840000887711844
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,1024,128,0.011037333144081963
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,1024,64,0.009696000152164036
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,768,65536,0.021495110458797876
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,1024,32,0.010064000056849586
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,768,51200,0.01776711146036784
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,1024,6144,0.015169777803950839
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,768,16384,0.010283555421564314
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,768,12288,0.010831111007266574
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,768,65536,0.05316088928116692
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,1024,4096,0.014094221923086377
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,768,10240,0.009642666412724389
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,768,51200,0.04383111000061035
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,768,16384,0.02204622162712945
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,768,8192,0.00888888869020674
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,768,7168,0.008643555144468943
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,768,12288,0.018595554762416415
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,768,6144,0.008344000412358178
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,768,10240,0.0177848885456721
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,768,5120,0.006919999917348226
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,768,8192,0.016211556063758004
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,768,7168,0.015449777245521545
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,768,4096,0.007270221908887227
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,768,3584,0.007198221981525421
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,768,6144,0.0151235560576121
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,768,3072,0.006903111106819577
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,768,5120,0.014562666416168213
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,768,2560,0.006333333336644703
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,768,4096,0.013091555900043912
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,768,2048,0.0052684446175893145
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,768,3584,0.013421333498424955
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,768,1536,0.004906666775544484
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,768,3072,0.013345777988433838
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,768,1024,0.004058666527271271
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,768,768,0.003552888830502828
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,768,2560,0.012755555411179861
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,768,2048,0.012175111307038201
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,768,512,0.0032133333798911837
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,768,1536,0.012048888537618848
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,768,256,0.003142222141226133
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,768,1024,0.012081777883900536
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,768,128,0.0028595555987623003
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,768,768,0.012430222498046027
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,768,512,0.011046222514576383
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,768,256,0.010696888797812991
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,768,32,0.00282577777074443
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,768,128,0.011420444481902652
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,512,65536,0.016926222377353244
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,768,64,0.01039644413524204
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,512,51200,0.014728888869285583
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,512,16384,0.01038933296998342
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,512,65536,0.05231822199291653
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,512,51200,0.043783111704720386
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,512,12288,0.008985777695973715
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,512,16384,0.02093688812520769
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,512,10240,0.007656888829337225
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,512,8192,0.008664888640244802
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,512,12288,0.018889778190188937
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,512,10240,0.017493334081437852
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,512,7168,0.00795111142926746
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,512,8192,0.016166221764352586
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,512,6144,0.007260444263617198
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,512,5120,0.0069297779765393995
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,512,7168,0.015513777732849121
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,512,6144,0.01514933341079288
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,512,4096,0.007259555160999298
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,512,5120,0.01444533301724328
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,512,3584,0.006636444479227066
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,512,3072,0.006576889091067844
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,512,4096,0.013787555197874704
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,512,2560,0.00628355559375551
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,512,3072,0.01312355531586541
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,512,2048,0.005948444621430502
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,768,64,0.0025173332542181015
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,512,2560,0.013071999781661563
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,512,1536,0.0042257776690853965
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,512,1024,0.003891555385457145
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,512,2048,0.012096888489193387
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,512,768,0.00351200004418691
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,512,1536,0.01239822225438224
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,768,32,0.010178666975763109
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,512,1024,0.011054221954610614
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,512,512,0.003216888962520493
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,512,256,0.003156444471743372
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,512,768,0.011763555308183035
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,512,128,0.002806222273243798
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,512,512,0.010701333483060202
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,512,64,0.0028231110837724474
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,512,256,0.01072177787621816
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,512,32,0.0028124445428450904
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,512,128,0.010739555789364709
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,256,65536,0.015473778049151102
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,512,32,0.009030222064918941
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,256,51200,0.013432000246312885
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,256,65536,0.04971111151907179
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,256,16384,0.008676444490750631
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,256,51200,0.040807998842663236
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,512,3584,0.014087999860445658
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,256,16384,0.02093511157565647
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,256,12288,0.008159110943476358
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,256,10240,0.0076044441925154785
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,256,8192,0.006981333096822103
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,256,7168,0.006637333167923822
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,256,12288,0.01886133352915446
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,256,10240,0.01788444485929277
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,256,8192,0.015799111790127225
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,256,6144,0.006583999842405319
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,256,5120,0.005919999960396025
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,256,7168,0.01551999979548984
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,256,4096,0.005758222192525864
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,256,3584,0.006204444501135085
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,256,6144,0.01514844430817498
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,256,5120,0.01444533301724328
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,256,3072,0.006174222048785951
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,256,4096,0.01310222182008955
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,256,2560,0.006263999889294307
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,256,2048,0.006121777825885349
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,256,3072,0.01313066648112403
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,256,1536,0.00453955555955569
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,256,2560,0.01273155543539259
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,256,1024,0.0038853333228164246
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,256,2048,0.01276266657643848
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,256,768,0.0035173334181308746
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,512,64,0.010474666953086853
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,256,1536,0.012450666891203986
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,256,512,0.0032142222755485107
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,256,256,0.0028195555011431375
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,256,768,0.012120889292822944
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,256,128,0.002570666579736604
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,256,512,0.012042666474978128
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,256,256,0.010685332947307162
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,256,128,0.011420444481902652
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,256,32,0.0028533333291610083
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,256,64,0.010654222634103564
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,128,65536,0.013901333014170328
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,256,32,0.010371555884679159
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,128,51200,0.01276622215906779
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,128,65536,0.04827466607093811
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,128,16384,0.007612444460391998
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,128,51200,0.04085955686039395
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,128,12288,0.007344889144102733
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,128,16384,0.020587555236286588
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,256,3584,0.013423110875818463
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,128,10240,0.0069324444565508105
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,128,8192,0.006586666736337874
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,128,12288,0.018915555543369718
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,128,10240,0.017148445049921673
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,128,8192,0.016144000821643405
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,128,6144,0.005906666732496685
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,256,1024,0.01143022212717268
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,128,7168,0.0151582227812873
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,128,5120,0.006234666539563074
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,128,4096,0.00555644432703654
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,128,6144,0.014787554740905762
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,256,64,0.0025333333760499954
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,128,5120,0.013785777820481194
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,128,3072,0.00564533347884814
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,128,4096,0.01311911145846049
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,128,2560,0.005895111295912001
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,128,3584,0.013810666898886362
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,128,2048,0.005903999838564131
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,128,3072,0.01276088919904497
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,128,1536,0.004523555437723796
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,128,2560,0.012727999852763282
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,128,1024,0.003871110992299186
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,128,768,0.003448888866437806
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,128,2048,0.012463111016485425
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,128,512,0.003162666741344664
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,128,1536,0.011726222104496427
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,128,1024,0.011349333657158745
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,128,256,0.002833777831660377
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,128,768,0.011066666907734342
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,128,128,0.0028195555011431375
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,128,64,0.002549333290921317
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,128,512,0.011722666521867117
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,128,32,0.002480888946188821
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,128,256,0.010395555860466426
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,128,128,0.010669333239396414
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,64,65536,0.010694222317801582
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,128,64,0.010075555907355415
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,128,32,0.009661333428488838
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,64,16384,0.0069884442620807225
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,64,65536,0.047988444566726685
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,64,51200,0.03994222150908576
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,64,12288,0.00590133335855272
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,64,16384,0.020966221888860066
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,64,10240,0.006228444476922353
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,64,12288,0.018194667167133756
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,128,3584,0.0058666666348775225
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,64,8192,0.005912000106440649
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,64,10240,0.017518222332000732
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,64,7168,0.005728000154097875
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,64,6144,0.005665777872006099
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,64,8192,0.016020443704393175
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,64,5120,0.005598222215970357
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,64,7168,0.015462223026487561
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,64,4096,0.005555555638339784
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,64,6144,0.01478488908873664
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,64,3584,0.005736888696750005
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,64,5120,0.014114666316244336
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,64,3072,0.0052826665341854095
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,64,4096,0.013767110804716745
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,64,2560,0.005954666684071223
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,64,3584,0.013408000270525614
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,64,2048,0.005576000031497743
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,64,3072,0.012797333300113678
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,64,1536,0.004232888834344016
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,64,2560,0.013061333033773633
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,64,51200,0.009647111097971598
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,64,2048,0.011768889096048145
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,64,768,0.00349866681628757
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,64,1536,0.01203733351495531
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,64,512,0.003149333306484752
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,64,1024,0.011438222395049201
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,64,256,0.0028328889360030494
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,64,768,0.011359111302428775
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,64,128,0.002599999929467837
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,64,512,0.010724444356229572
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,64,64,0.002502222235004107
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,64,256,0.010384000009960597
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,64,32,0.0024746666765875286
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,64,128,0.010682666467295753
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,32,65536,0.008984000318580205
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,64,64,0.01055466632048289
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,32,51200,0.008645333349704742
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,32,16384,0.006232000059551663
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,32,65536,0.047932446002960205
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,32,51200,0.04002844293912252
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,32,12288,0.005966222120655908
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,32,10240,0.005883555445406172
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,32,12288,0.018266666266653273
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,32,8192,0.005594666633341048
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,32,8192,0.015928000211715698
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,32,7168,0.005971555494599872
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,64,1024,0.0038933331767717996
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,32,6144,0.005583111196756363
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,128,7168,0.00628355559375551
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,32,5120,0.005659555395444234
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,32,7168,0.015230221880806817
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,32,4096,0.005212444398138259
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,32,6144,0.014828445182906257
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,32,3584,0.005568888866239124
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,32,5120,0.0148053334818946
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,32,4096,0.013059555656380124
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,32,3584,0.013757333159446716
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,32,2560,0.005984888722499211
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,32,3072,0.012734221915404001
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,64,32,0.010010666317409938
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,32,2048,0.0052844443255000645
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,32,1536,0.004253333227501975
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,32,2560,0.013077333569526672
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,32,1024,0.0038524443904558816
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,32,16384,0.020613332589467365
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,32,1536,0.012040889097584618
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,32,768,0.0033271111961868075
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,32,512,0.0031893334041039148
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,32,1024,0.011771555576059552
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,32,10240,0.01687466601530711
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,32,256,0.0028648889727062653
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,32,768,0.011439999772442712
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,32,128,0.0028106667515304354
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,32,512,0.010750222537252637
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,32,64,0.002520888836847411
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,32,32,0.0025315555847353404
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,32,256,0.010064000056849586
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,32,128,0.010967999696731567
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,32,64,0.009713778065310584
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,32,32,0.009562667045328353
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,5,32,3072,0.005691555639108022
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,65536,16384,0.339391099082099
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,65536,51200,0.4947039816114638
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,65536,16384,0.23125688234965006
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,5,32,2048,0.01199288914601008
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,65536,12288,0.2570097711351183
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,65536,51200,1.0108044942220051
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,65536,12288,0.1578880018658108
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,65536,10240,0.21745333406660292
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,65536,8192,0.16842222213745117
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,65536,10240,0.14517777495914036
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,65536,8192,0.12633600499894884
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,65536,7168,0.14647555351257324
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,65536,7168,0.10736888647079468
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,65536,12288,0.14467199643452963
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,65536,10240,0.12585155169169107
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,65536,6144,0.12818577554490831
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,65536,16384,0.18922932942708334
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,65536,6144,0.0959928896692064
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,65536,8192,0.10771199729707505
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,65536,5120,0.10279644197887844
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,65536,4096,0.08386755651897854
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,65536,5120,0.08566221925947402
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,65536,4096,0.06999733050664265
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,65536,3584,0.07276088661617704
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,65536,5120,0.07609155442979601
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,65536,6144,0.08569955825805664
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,65536,4096,0.06640977991951837
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,65536,7168,0.0959013303120931
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,65536,3072,0.0630177789264255
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,65536,3584,0.0653031137254503
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,65536,2560,0.053098665343390576
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,65536,3072,0.05420266588528951
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,65536,2048,0.04411733481619093
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,65536,2560,0.05102399984995524
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,65536,3584,0.06079555882347954
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,65536,3072,0.05540088812510172
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,65536,1536,0.03325244453218248
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,65536,2048,0.03952711158328586
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,65536,2560,0.050981332858403526
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,65536,1536,0.03576533330811395
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,65536,2048,0.04782488942146301
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,65536,768,0.01886666648917728
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,65536,1536,0.04093066520161099
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,65536,1024,0.023800000548362732
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,65536,1024,0.03552888830502828
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,65536,512,0.013757333159446716
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,65536,768,0.023173333870040044
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,65536,256,0.008737777670224508
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,65536,512,0.018618666463428073
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,65536,512,0.029806223180558946
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,65536,128,0.006227555374304454
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,65536,256,0.024996444582939148
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,65536,256,0.015736889508035447
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,65536,64,0.005882666756709416
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,65536,128,0.01481599940194024
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,65536,128,0.022672888305452134
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,65536,32,0.005603555589914322
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,65536,64,0.0143857780430052
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,65536,32,0.013813333378897773
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,65536,1024,0.02382844520939721
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,51200,65536,0.5231279797024196
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,65536,768,0.03132889005872939
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,51200,65536,0.9706498252020942
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,65536,51200,0.5184666845533583
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,51200,51200,0.39736445744832355
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,51200,16384,0.25299021932813853
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,51200,51200,0.7547973526848687
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,51200,12288,0.19243644343482125
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,51200,16384,0.19049599435594347
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,51200,12288,0.12877244419521755
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,51200,10240,0.16084533267551
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,51200,10240,0.11316355069478352
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,51200,8192,0.0994524425930447
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,51200,8192,0.13285333580440944
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,51200,7168,0.1160728931427002
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,51200,12288,0.1206924385494656
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,51200,10240,0.10612177848815918
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,51200,7168,0.08888977766036987
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,51200,16384,0.15524978107876247
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,51200,8192,0.09099111292097305
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,51200,6144,0.0797520014974806
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,51200,5120,0.08909422159194946
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,51200,7168,0.08245155546400282
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,51200,5120,0.07325600253211127
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,51200,4096,0.07331999805238512
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,51200,6144,0.0728364454375373
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,51200,4096,0.05965422259436714
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,51200,5120,0.06488088766733806
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,51200,3584,0.05382755398750305
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,51200,3072,0.0556924475563897
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,51200,4096,0.05657866928312513
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,51200,3584,0.05384799838066101
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,51200,6144,0.1013902227083842
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,51200,3072,0.04680622286266751
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,51200,2560,0.046578665574391685
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,51200,2048,0.037823110818862915
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,51200,2560,0.04430844386418661
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,51200,2560,0.04644711150063408
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,51200,2048,0.034212443563673235
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,51200,1536,0.02966488732231988
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,51200,2048,0.04317511121431986
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,51200,1024,0.020834666159417894
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,51200,1536,0.029726223813162908
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,51200,1536,0.03853066762288412
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,51200,768,0.015984889533784654
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,51200,3584,0.06348088714811537
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,51200,1024,0.02127733329931895
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,51200,1024,0.03188177943229675
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,51200,512,0.010990222295125326
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,51200,768,0.020909332566791113
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,51200,512,0.01722133325205909
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,51200,256,0.007277333074145847
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,51200,512,0.02847644355561998
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,51200,128,0.0038951109680864546
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,51200,256,0.025774222281244066
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,51200,768,0.030922667847739324
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,51200,3072,0.04923199945025974
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,51200,51200,0.41494933764139813
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,51200,128,0.014123555686738757
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,51200,64,0.003576000117593341
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,51200,32,0.003528000166018804
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,51200,128,0.02201866606871287
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,51200,32,0.012274666792816587
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,51200,64,0.013420444395807056
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,16384,65536,0.3201564417945014
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,16384,65536,0.18291733000013563
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,51200,65536,0.5259128676520454
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,16384,51200,0.24808979034423828
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,16384,16384,0.0855591098467509
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,16384,51200,0.13889511426289877
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,16384,12288,0.06630666388405694
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,16384,16384,0.0753199987941318
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,51200,256,0.013986666997273764
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,16384,10240,0.05667822228537666
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,16384,12288,0.058916442924075656
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,16384,10240,0.04895200000868904
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,16384,12288,0.057427558634016246
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,16384,8192,0.04383200075891283
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,16384,16384,0.07003733184602526
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,16384,7168,0.037976887491014265
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,16384,10240,0.05496889021661547
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,16384,8192,0.04419022136264377
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,16384,6144,0.0329039990901947
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,16384,7168,0.03997777899106344
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,16384,8192,0.04770844512515598
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,16384,5120,0.02853155467245314
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,16384,7168,0.04603644543223911
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,16384,6144,0.040151112609439425
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,16384,4096,0.02331377731429206
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,16384,5120,0.032531556155946516
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,16384,6144,0.0410426656405131
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,16384,3584,0.020658666888872784
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,16384,51200,0.15688089529673258
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,16384,5120,0.03902577691608005
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,16384,4096,0.028380443652470905
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,16384,3072,0.018273777431911893
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,16384,4096,0.03584266702334086
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,16384,3584,0.02574311031235589
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,16384,65536,0.1929182211558024
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,16384,3584,0.03338222371207343
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,16384,2560,0.015494222442309061
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,16384,3072,0.024176888995700415
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,16384,3072,0.03144977821244134
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,16384,1536,0.010956444674068026
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,16384,2560,0.030057777961095173
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,16384,2560,0.0233324451578988
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,16384,2048,0.018943111101786297
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,16384,1024,0.008604444563388824
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,16384,1536,0.027453333139419556
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,16384,1536,0.018180444836616516
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,16384,768,0.007081777685218387
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,16384,512,0.004912888838185204
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,16384,1024,0.025256888733969793
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,16384,1024,0.015189333094490899
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,16384,256,0.00350577798154619
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,16384,768,0.014049778381983439
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,16384,512,0.012096000214417776
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,16384,512,0.02164711058139801
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,16384,128,0.0031840000301599503
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,16384,256,0.0124195557501581
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,16384,64,0.002887111157178879
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,16384,128,0.011709333293967776
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,16384,32,0.0028124445428450904
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,16384,64,0.01146488885084788
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,16384,32,0.009679111341635386
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,12288,65536,0.24368177519904244
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,12288,65536,0.15204711755116782
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,16384,2048,0.013065777719020844
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,16384,2048,0.02951644526587592
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,12288,51200,0.1894328859117296
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,12288,16384,0.06718222300211589
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,12288,51200,0.12044089370303684
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,16384,768,0.023208889696333144
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,12288,12288,0.051817778084013194
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,16384,256,0.021720889541837905
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,12288,16384,0.06670311424467298
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,16384,128,0.02090399960676829
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,12288,10240,0.04417066772778829
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,12288,16384,0.06001066499286228
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,12288,10240,0.0455022222465939
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,12288,8192,0.03904533386230469
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,12288,12288,0.049991998407575816
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,12288,7168,0.03467911150720384
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,12288,10240,0.04615288972854614
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,12288,8192,0.039368887742360435
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,12288,6144,0.030497776137457952
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,12288,8192,0.04224444429079691
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,12288,7168,0.035368889570236206
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,12288,5120,0.026541334059503343
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,12288,7168,0.03988533218701681
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,12288,6144,0.03473866648144192
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,12288,51200,0.1216942204369439
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,12288,65536,0.15299110942416722
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,12288,4096,0.022953778505325317
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,12288,6144,0.036664889918433294
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,12288,5120,0.03393777873780992
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,12288,3584,0.020464888877338834
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,12288,4096,0.026170666019121807
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,12288,3072,0.018019555343521964
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,12288,3584,0.02422044508987003
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,12288,3584,0.031045334206687078
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,12288,2560,0.015599111715952555
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,12288,3072,0.02383822202682495
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,12288,3072,0.028991109795040552
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,12288,12288,0.05108355482419332
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,12288,2560,0.020233778489960563
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,12288,2048,0.013548444542619916
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,12288,1536,0.008762666748629676
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,12288,2048,0.018191110756662156
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,12288,2048,0.027111111415757075
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,12288,1024,0.0068400001360310455
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,12288,1536,0.017160000072585214
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,12288,1536,0.026769777139027912
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,12288,768,0.00554933316177792
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,12288,1024,0.013497778111033969
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,12288,1024,0.022295999858114455
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,12288,512,0.004187555362780889
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,12288,768,0.013420444395807056
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,12288,768,0.021291555629836187
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,12288,256,0.00342755557762252
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,12288,512,0.0217884447839525
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,12288,512,0.012290666500727335
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,12288,128,0.003148444410827425
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,12288,256,0.011360000405046674
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,12288,256,0.02161955502298143
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,12288,64,0.0028311111446883944
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,12288,4096,0.03256888853179084
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,12288,128,0.019447111421161227
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,12288,128,0.011086222198274402
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,12288,32,0.0028275555620590844
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,12288,32,0.009321778184837764
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,10240,65536,0.20471555656856963
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,10240,65536,0.14963911639319524
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,10240,51200,0.11558932728237575
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,10240,16384,0.05773599942525228
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,10240,16384,0.05615378088421292
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,12288,5120,0.02980533242225647
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,10240,12288,0.045243554645114474
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,10240,12288,0.04606577754020691
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,10240,16384,0.05494577685991923
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,10240,51200,0.10927022165722317
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,12288,64,0.011029333704047732
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,10240,65536,0.13451911343468562
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,10240,10240,0.03865244322352939
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,10240,8192,0.03269688950644599
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,12288,2560,0.029273778200149536
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,10240,10240,0.041730665498309664
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,10240,8192,0.033639109796947904
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,10240,12288,0.04682577649752299
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,10240,7168,0.029123554627100628
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,10240,6144,0.026512889398468867
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,10240,8192,0.041096889310412936
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,10240,7168,0.03694399860170152
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,10240,5120,0.02278577784697215
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,10240,6144,0.02801688843303257
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,10240,6144,0.03549955619706048
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,10240,5120,0.025059555967648823
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,10240,4096,0.019560888409614563
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,10240,5120,0.03418311145570543
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,10240,3584,0.017605332864655387
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,10240,4096,0.022457778453826904
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,10240,4096,0.030304001437293157
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,10240,3072,0.016171556380059984
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,10240,3584,0.031039112144046362
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,10240,3584,0.021431111627154883
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,10240,2560,0.014540443817774454
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,10240,3072,0.019832000136375427
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,10240,3072,0.02901600135697259
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,10240,2048,0.010319111247857412
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,10240,2560,0.019276445110638935
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,10240,2560,0.028431998358832464
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,10240,1536,0.008986666798591614
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,10240,2048,0.027078222897317674
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,10240,2048,0.01679999960793389
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,10240,1024,0.006326222171386083
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,10240,1536,0.02751200066672431
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,10240,1536,0.01664177742269304
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,10240,768,0.004566222015354368
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,10240,51200,0.16182843844095865
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,10240,1024,0.01276000009642707
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,10240,1024,0.022230222821235657
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,10240,512,0.003556444413132138
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,10240,768,0.022626666559113398
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,10240,768,0.013398222625255585
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,10240,256,0.0032115555885765287
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,10240,10240,0.043175998661253184
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,10240,128,0.0028239999794297745
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,10240,512,0.02132533325089349
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,10240,512,0.011696889168686338
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,10240,64,0.0028204443968004654
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,10240,256,0.021617778473430212
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,10240,7168,0.030674666166305542
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,10240,32,0.0028168888141711554
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,10240,128,0.019201777047581144
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,10240,128,0.011362666885058085
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,10240,256,0.011709333293967776
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,10240,64,0.011023110813564725
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,10240,32,0.010015111002657149
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,8192,65536,0.1721200015809801
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,8192,51200,0.12993244330088297
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,8192,65536,0.10115733411577012
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,8192,16384,0.04686489038997226
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,8192,51200,0.07749244239595202
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,8192,12288,0.03338311115900675
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,8192,16384,0.0429440008269416
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,8192,12288,0.03638844357596503
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,8192,10240,0.028806222809685603
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,8192,16384,0.05260711246066623
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,8192,8192,0.023815110325813293
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,8192,10240,0.03234400020705329
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,8192,12288,0.04620711008707682
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,8192,7168,0.020720889170964558
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,8192,8192,0.027076444692081873
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,8192,8192,0.038273778226640486
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,8192,51200,0.10429600212309097
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,8192,6144,0.019077334139082167
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,8192,65536,0.125636445151435
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,8192,7168,0.036002665758132935
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,8192,5120,0.01612355477280087
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,8192,6144,0.02365333338578542
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,8192,6144,0.03429866830507914
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,8192,4096,0.013733333183659447
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,8192,5120,0.021271111236678228
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,8192,5120,0.032872888776991106
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,8192,3584,0.012091555529170565
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,8192,4096,0.019504000743230183
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,8192,3072,0.011207111179828644
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,8192,3584,0.029513776302337646
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,8192,3072,0.01761777698993683
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,8192,3072,0.028088887532552082
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,8192,2560,0.009916444619496664
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,8192,2560,0.027854220734702215
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,8192,2560,0.016781333420011733
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,8192,2048,0.00832088871134652
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,8192,2048,0.027057778504159715
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,8192,2048,0.015481778317027621
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,8192,10240,0.0427724454138014
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,8192,1536,0.006963555183675554
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,8192,1024,0.0058764442801475525
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,8192,1536,0.025007999605602686
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,8192,1536,0.014460444450378418
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,8192,768,0.004179555508825514
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,8192,1024,0.012058667010731168
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,8192,7168,0.025999110605981614
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,8192,512,0.003535110917356279
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,8192,1024,0.02271644439962175
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,8192,768,0.012059555285506778
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,8192,768,0.021976888179779053
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,8192,256,0.0031991110493739447
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,8192,512,0.02239022155602773
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,8192,512,0.012061333490742577
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,8192,128,0.0028640000770489373
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,8192,4096,0.03088266650835673
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,8192,256,0.011023110813564725
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,8192,256,0.020285333196322124
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,8192,64,0.002536888958679305
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,8192,32,0.0028568889117903183
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,8192,3584,0.01886399918132358
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,8192,128,0.02165066699186961
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,8192,128,0.01143555591503779
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,8192,64,0.010741333166758219
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,8192,32,0.009668444593747457
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,7168,51200,0.1164346668455336
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,7168,65536,0.14715911282433405
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,7168,65536,0.0925146672460768
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,7168,16384,0.04272177815437317
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,7168,51200,0.07131644752290514
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,7168,12288,0.03408711155255636
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,7168,16384,0.04486755530039469
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,7168,10240,0.029342220889197454
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,7168,12288,0.03527822097142538
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,7168,16384,0.05214666657977634
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,7168,12288,0.04597155584229363
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,7168,8192,0.02498311135503981
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,7168,10240,0.029735998974906072
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,7168,7168,0.01907822158601549
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,7168,10240,0.04150044586923387
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,7168,8192,0.02783999840418498
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,7168,6144,0.01751733322938283
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,7168,8192,0.03804711169666714
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,7168,51200,0.10407555765575832
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,7168,65536,0.12502222590976292
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,7168,5120,0.014984000060293408
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,7168,7168,0.03597955571280585
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,7168,4096,0.012475555141766867
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,7168,6144,0.023051554958025616
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,7168,6144,0.03417777683999803
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,7168,3584,0.011197333534558615
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,7168,5120,0.0329368876086341
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,7168,5120,0.021249777740902368
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,7168,4096,0.018872888551818002
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,7168,4096,0.03119200136926439
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,7168,3072,0.01032977799574534
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,7168,2560,0.009486222432719337
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,7168,3584,0.030438221163219873
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,7168,3584,0.01847288840346866
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,7168,3072,0.02920711040496826
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,7168,3072,0.01715555621518029
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,7168,2048,0.007917332980367873
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,7168,2560,0.016869333055284288
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,7168,2560,0.02791822287771437
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,7168,1536,0.006696888970004187
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,7168,2048,0.014428445034556918
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,7168,2048,0.027874665127860174
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,7168,1024,0.004567999806669024
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,7168,1536,0.013983110586802164
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,7168,1536,0.024010666542583044
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,7168,768,0.0038399998512532976
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,7168,1024,0.012784889174832238
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,7168,512,0.0035333335399627686
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,7168,768,0.022128888302379187
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,7168,256,0.0031742221779293488
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,7168,512,0.012068444656001197
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,7168,512,0.021551999780866835
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,7168,128,0.0028648889727062653
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,7168,256,0.01036977767944336
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,7168,256,0.02199733257293701
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,7168,7168,0.024043555061022442
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,7168,64,0.0028648889727062653
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,7168,32,0.002858666703104973
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,7168,128,0.011077333655622272
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,7168,128,0.020568889048364427
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,7168,64,0.010000000397364298
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,7168,32,0.010054222411579555
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,6144,65536,0.1272666719224718
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,6144,65536,0.08200533522499932
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,6144,51200,0.0967893335554335
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,6144,16384,0.03862222366862827
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,6144,51200,0.0649813347392612
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,6144,16384,0.037993778785069786
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,6144,12288,0.030414223670959473
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,6144,16384,0.05177155468198988
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,7168,1024,0.021943999661339655
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,6144,10240,0.02569599946339925
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,7168,768,0.012404444317022959
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,6144,12288,0.0322106679280599
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,6144,65536,0.12486844592624241
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,6144,51200,0.10274577803081936
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,6144,12288,0.04483288857671949
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,6144,10240,0.02870933214823405
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,6144,10240,0.04198933309978909
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,6144,7168,0.020080000162124634
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,6144,8192,0.025251555773946974
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,6144,8192,0.037408000893063016
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,6144,6144,0.01757777730623881
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,6144,7168,0.02330400049686432
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,6144,5120,0.015793777174419828
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,6144,7168,0.03581155671013726
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,6144,6144,0.033951110310024686
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,6144,4096,0.011624000138706632
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,6144,6144,0.022291556000709534
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,6144,5120,0.03239555491341485
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,6144,5120,0.020304888486862183
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,6144,3584,0.010212444596820408
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,6144,3072,0.009287999735938178
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,6144,4096,0.030233777231640283
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,6144,4096,0.018583110637134977
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,6144,3584,0.029488888051774766
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,6144,3584,0.01794577803876665
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,6144,3072,0.02853155467245314
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,6144,2048,0.007603555917739868
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,6144,2560,0.02747022277779049
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,6144,2560,0.016184889607959323
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,6144,1536,0.006500444478458828
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,6144,2048,0.01444355481200748
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,6144,2048,0.0262755552927653
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,6144,1024,0.0046951112647851305
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,6144,1536,0.013402666482660504
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,6144,1536,0.0236488895283805
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,6144,768,0.003567999849716822
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,6144,1024,0.012060444388124677
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,6144,1024,0.022277333670192297
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,6144,512,0.003391999958289994
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,6144,8192,0.022700443863868713
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,6144,768,0.012416889270146688
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,6144,256,0.0031724443866146933
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,6144,512,0.02275377843115065
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,6144,512,0.01109777804878023
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,6144,128,0.0028284444577164124
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,6144,256,0.01106844428512785
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,6144,256,0.021634666456116572
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,6144,64,0.002850666642189026
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,6144,128,0.011030221978823343
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,6144,32,0.0028293333533737394
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,6144,64,0.010370666782061258
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,6144,2560,0.008637333081828224
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,6144,32,0.009711999860074785
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,5120,65536,0.10837333069907294
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,5120,51200,0.08572089009814793
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,5120,65536,0.07555555635028414
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,5120,51200,0.05954222546683418
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,5120,16384,0.03369866808255514
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,6144,768,0.021945777866575453
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,5120,65536,0.12365244494544135
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,5120,16384,0.034929778840806745
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,5120,12288,0.027101332942644756
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,5120,51200,0.10260355472564697
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,5120,10240,0.022795556320084467
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,5120,16384,0.05130844314893087
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,5120,12288,0.04481600059403313
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,6144,128,0.020253333780500624
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,5120,10240,0.0277511113219791
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,5120,10240,0.04036622246106466
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,5120,7168,0.017817777064111497
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,5120,8192,0.02421333392461141
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,5120,8192,0.03698488738801744
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,6144,3072,0.016490666402710807
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,5120,7168,0.03548889027701484
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,5120,7168,0.022631110416518316
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,5120,5120,0.014137778017255994
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,5120,6144,0.022343110707071092
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,5120,4096,0.010657777388890585
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,5120,5120,0.03219022353490194
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,5120,4096,0.018002667360835604
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,5120,4096,0.03013155526585049
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,5120,3584,0.009347555538018545
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,5120,3584,0.029104888439178467
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,5120,3584,0.017157332764731515
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,5120,3072,0.008605333666006723
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,5120,3072,0.027747554911507502
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,5120,2560,0.00794488853878445
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,5120,12288,0.03021866745418972
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,5120,8192,0.020599111914634705
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,5120,2560,0.026156443688604567
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,5120,2048,0.013753777576817406
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,5120,6144,0.016582222448454965
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,5120,1536,0.00526311124364535
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,5120,2048,0.023990222149425085
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,5120,6144,0.03321155574586656
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,5120,1024,0.0041982221106688184
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,5120,1536,0.013769778112570444
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,5120,5120,0.019925332731670804
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,5120,768,0.0038284444146686127
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,5120,1024,0.02275200022591485
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,5120,1024,0.011777777638700275
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,5120,512,0.0031822222388452957
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,5120,768,0.011704888608720569
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,5120,768,0.022630222969584998
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,5120,256,0.0029493332323100832
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,5120,512,0.011065777805116443
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,5120,512,0.021271111236678228
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,5120,128,0.0028080000645584534
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,5120,256,0.019910222954220243
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,5120,256,0.011379555695586734
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,5120,3072,0.015967999895413715
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,5120,64,0.002480888946188821
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,5120,32,0.002529777793420686
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,5120,128,0.010738666686746808
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,5120,128,0.018928888771269057
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,5120,64,0.010392888552612728
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,4096,65536,0.09012444151772393
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,5120,2048,0.006766222417354584
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,5120,32,0.009321778184837764
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,4096,51200,0.0690222250090705
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,4096,65536,0.0691573354932997
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,4096,16384,0.02757511039574941
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,4096,51200,0.055014222860336304
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,4096,12288,0.02163999941613939
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,4096,16384,0.035931554105546736
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,4096,16384,0.050429334243138633
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,5120,1536,0.023152000374264185
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,4096,10240,0.018552889426549275
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,4096,51200,0.10303644339243571
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,4096,12288,0.04332977864477369
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,4096,65536,0.12379822466108535
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,4096,8192,0.016356445021099515
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,4096,7168,0.015022221538755627
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,4096,10240,0.026712889472643535
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,4096,10240,0.04029422336154514
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,4096,8192,0.02330044408639272
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,4096,6144,0.013052444491121503
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,4096,7168,0.02164711058139801
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,4096,7168,0.03524533245298598
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,4096,5120,0.012253333297040729
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,4096,6144,0.032906668053732976
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,4096,6144,0.02074399921629164
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,4096,4096,0.010932444698280759
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,4096,5120,0.0321760012043847
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,4096,3584,0.011351111034552256
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,4096,4096,0.029442667961120605
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,4096,4096,0.01720622181892395
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,4096,3072,0.01036444471942054
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,5120,2560,0.015458666616015963
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,4096,3584,0.02793777651256985
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,4096,3584,0.01650044487582313
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,4096,2560,0.00923288861910502
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,4096,3072,0.014814222852389017
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,4096,3072,0.02683111031850179
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,4096,2048,0.007947555846638149
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,4096,2560,0.02437155610985226
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,4096,2560,0.014831999937693277
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,4096,1536,0.006647999915811751
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,4096,2048,0.023415111833148535
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,4096,2048,0.01311911145846049
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,4096,1024,0.004920888692140579
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,4096,1536,0.022312889496485393
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,4096,12288,0.028505778974956934
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,4096,768,0.0045422220395671
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,4096,1024,0.021456888980335657
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,4096,768,0.011734222372372946
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,4096,8192,0.03681333197487725
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,4096,512,0.0038648889296584656
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,4096,256,0.0028613333900769553
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,4096,512,0.011037333144081963
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,4096,5120,0.01944533321592543
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,4096,256,0.021031111478805542
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,4096,256,0.011018666956159802
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,4096,128,0.0028044444819291434
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,4096,64,0.0028080000645584534
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,4096,128,0.020989333589871723
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,4096,128,0.011023110813564725
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,4096,32,0.002838222309947014
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,4096,64,0.010738666686746808
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,3584,65536,0.08121777905358209
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,4096,32,0.009565333525339762
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,3584,65536,0.06646666924158733
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,3584,51200,0.06350577539867826
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,4096,1536,0.013472889032628802
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,3584,16384,0.02539288832081689
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,4096,1024,0.011711999773979187
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,3584,51200,0.05350222190221151
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,3584,12288,0.01959288948112064
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,3584,16384,0.0318248901102278
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,4096,768,0.02159999973244137
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,3584,16384,0.05010133319430881
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,3584,10240,0.01759466694460975
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,3584,51200,0.10248533222410415
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,3584,8192,0.015199111567603217
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,3584,12288,0.02618933386272854
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,3584,12288,0.044159111049440175
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,4096,512,0.022317333353890315
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,3584,10240,0.02405866649415758
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,3584,10240,0.040228443013297185
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,3584,6144,0.01274400038851632
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,3584,8192,0.037584000163608126
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,3584,8192,0.02217777735657162
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,3584,5120,0.011408000356621213
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,3584,7168,0.021271111236678228
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,3584,7168,0.03463110989994473
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,3584,4096,0.010371555884679159
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,3584,6144,0.034272889296213783
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,3584,6144,0.019588443968031142
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,3584,3584,0.01036800030204985
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,3584,5120,0.03247911069128249
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,3584,4096,0.029820445511076186
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,3584,4096,0.016201777590645682
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,3584,3072,0.009663999908500248
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,3584,3584,0.014575110541449653
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,3584,3584,0.028396444188223943
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,3584,2560,0.0083137775460879
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,3584,3072,0.026410667432679072
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,3584,3072,0.0141004439857271
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,3584,2048,0.007055111229419708
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,3584,2560,0.02437866727511088
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,3584,1536,0.005879999862776862
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,3584,2048,0.012780444489585029
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,3584,1536,0.012422222230169507
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,3584,1536,0.0221733334991667
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,3584,1024,0.005205333232879639
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,3584,65536,0.12319378058115642
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,3584,1024,0.021597334080272253
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,3584,768,0.0041866666740841335
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,3584,1024,0.011697777443461947
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,3584,512,0.0038480001191298165
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,3584,7168,0.013455111119482251
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,3584,768,0.021937777598698933
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,3584,768,0.011405333048767514
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,3584,256,0.0028408887899584244
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,3584,512,0.011003555523024665
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,3584,512,0.02200355629126231
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,3584,256,0.010724444356229572
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,3584,256,0.021262221866183813
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,3584,64,0.002483555633160803
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,3584,5120,0.018188445104493033
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,3584,128,0.011374221907721626
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,3584,32,0.0028284444577164124
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,3584,64,0.01038577738735411
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,3072,65536,0.06982577509350248
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,3584,32,0.009348444640636444
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,3072,51200,0.054661333560943604
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,3584,2560,0.014914666612943014
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,3072,65536,0.06327288680606417
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,3072,16384,0.02183466653029124
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,3072,51200,0.05164177881346809
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,3072,16384,0.03161688976817661
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,3072,65536,0.12351289060380723
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,3072,12288,0.017941332525677152
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,3072,16384,0.05066755414009094
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,3072,51200,0.1035226649708218
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,3072,10240,0.01575555569595761
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,3072,12288,0.026155556241671245
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,3072,12288,0.04281599985228645
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,3072,10240,0.024077332682079736
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,3072,8192,0.013621333572599622
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,3072,10240,0.040820442967944674
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,3072,7168,0.012612444659074148
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,3584,128,0.0028293333533737394
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,3072,8192,0.036983112494150795
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,3072,8192,0.02176622218555874
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,3072,6144,0.011620444556077322
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,3072,7168,0.019684443871180218
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,3072,7168,0.03490488727887472
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,3072,5120,0.01068800025516086
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,3584,128,0.01925244430700938
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,3072,6144,0.01955200069480472
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,3072,6144,0.03357955482270982
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,3072,4096,0.009563555320103964
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,3072,3584,0.009103111094898647
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,3072,5120,0.01774133410718706
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,3072,5120,0.031614220804638334
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,3072,3072,0.008997333546479544
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,3072,4096,0.027106665902667578
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,3072,4096,0.015481778317027621
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,3072,2560,0.007603555917739868
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,3072,3584,0.028423110644022625
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,3072,3584,0.014706666270891825
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,3072,2048,0.006616000086069107
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,3072,3072,0.025174222058720056
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,3584,2048,0.024400000770886738
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,3072,2560,0.02407199972205692
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,3072,2560,0.013791110780504016
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,3072,1536,0.006728000111050076
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,3072,1024,0.004862222406599256
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,3072,2048,0.023014222582181294
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,3072,1536,0.02306488818592495
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,3072,1536,0.012375999655988483
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,3072,768,0.004559999952713649
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,3072,1024,0.021368889345063105
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,3072,1024,0.012096000214417776
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,3072,512,0.0041848888827694785
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,3072,768,0.011039111349317761
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,3072,256,0.00350222239891688
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,3072,512,0.0206631107462777
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,3072,256,0.020263999700546265
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,3072,256,0.010398222340477837
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,3072,128,0.003154666680428717
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,3072,128,0.019263111882739596
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,3072,64,0.002528888897763358
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,3072,64,0.009651555783218807
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,3072,32,0.0028035555862718155
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,3072,3072,0.014107555150985718
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,3072,32,0.00868622213602066
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,2560,65536,0.0590933362642924
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,3072,2048,0.013155555559529198
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,2560,51200,0.04777155650986565
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,2560,65536,0.060812446806165904
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,3072,768,0.02162666618824005
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,2560,51200,0.05011377731959025
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,2560,16384,0.01960266629854838
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,2560,65536,0.12401155630747478
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,2560,12288,0.015792000624868605
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,2560,16384,0.028160889943440754
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,2560,16384,0.04963289035691155
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,2560,10240,0.013904000322024027
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,2560,12288,0.04392177859942118
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,2560,12288,0.025427555044492085
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,3072,128,0.011052444577217102
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,2560,8192,0.012141333685980903
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,2560,10240,0.02233155568440755
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,2560,7168,0.011630222201347351
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,2560,10240,0.041237334410349526
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,2560,8192,0.020192000601026747
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,2560,6144,0.010885333021481832
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,2560,7168,0.0192266669538286
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,2560,6144,0.018260444204012554
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,2560,6144,0.032462222708596125
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,2560,5120,0.009579555855857002
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,2560,5120,0.03122488988770379
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,2560,5120,0.016366221838527255
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,2560,4096,0.008952889177534316
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,2560,4096,0.02684177789423201
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,2560,4096,0.014648889501889547
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,3072,512,0.011358222199810876
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,2560,3584,0.008627555436558193
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,2560,3072,0.008204444415039485
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,2560,51200,0.10267377561993069
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,2560,3584,0.027078222897317674
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,2560,2560,0.00702044450574451
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,2560,3072,0.013586666848924426
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,2560,3072,0.025019556283950806
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,2560,2048,0.005935110979610019
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,2560,2560,0.023990222149425085
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,2560,2560,0.013586666848924426
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,2560,1536,0.005893333504597346
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,2560,2048,0.012410666379663678
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,2560,8192,0.036552889479531184
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,2560,1024,0.004564444637960858
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,2560,1536,0.012447111308574677
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,2560,7168,0.035311109489864774
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,2560,1536,0.02232444451914893
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,2560,768,0.004541333350870344
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,2560,1024,0.012334222594896952
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,2560,1024,0.022983999715911016
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,2560,512,0.0038515557017591265
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,2560,768,0.011120888921949597
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,2560,768,0.022711111439598933
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,2560,256,0.003510222252872255
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,2560,512,0.022190221481853064
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,2560,512,0.01051644484202067
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,2560,128,0.0028613333900769553
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,2560,256,0.011381333072980246
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,2560,64,0.002838222309947014
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,2560,128,0.02161955502298143
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,2560,128,0.010747555229398938
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,2560,32,0.0028435554769304064
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,2048,65536,0.05185866687032911
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,2560,64,0.01033866653839747
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,2560,32,0.009316444396972656
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,2560,3584,0.013773333695199756
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,2048,51200,0.04111999935574002
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,2048,65536,0.05920888980229696
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,2048,16384,0.015785778562227886
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,2048,51200,0.048639999495612256
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,2048,65536,0.1244479947619968
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,2048,12288,0.01310400002532535
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,2048,16384,0.02479822271400028
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,2048,51200,0.10157510969373916
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,2560,2048,0.023327999644809302
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,2048,10240,0.011759999725553723
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,2048,12288,0.04361244373851352
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,2048,12288,0.022301332818137273
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,2048,10240,0.03970044520166185
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,2048,8192,0.011001778145631155
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,2048,10240,0.02160444524553087
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,2048,7168,0.011015111373530494
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,2048,8192,0.019362666540675692
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,2048,8192,0.03599822190072801
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,2048,7168,0.018477333916558158
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,2048,6144,0.009683555199040307
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,2048,5120,0.009309333231714036
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,2560,256,0.01994311147265964
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,2048,6144,0.03160533308982849
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,2048,6144,0.01717155509524875
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,2048,4096,0.01033866653839747
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,2048,5120,0.01514311134815216
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,2048,5120,0.029383109675513372
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,2048,4096,0.014163555370436775
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,2048,4096,0.026717333330048457
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,2048,3072,0.006588444527652528
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,2048,3584,0.013802666631009845
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,2048,3584,0.02608888844648997
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,2048,2560,0.00591111100382275
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,2048,3072,0.013433777623706393
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,2048,3072,0.024716445141368445
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,2048,2048,0.006979555719428592
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,2048,2560,0.013077333569526672
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,2048,2048,0.012442666623327466
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,2048,1536,0.00572533326016532
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,2048,2048,0.023494222097926672
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,2048,1536,0.012050666742854647
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,2048,1536,0.022671999202834234
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,2048,1024,0.004563555535342959
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,2048,7168,0.03495733274353875
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,2048,1024,0.011711111499203576
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,2048,1024,0.021525333325068157
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,2048,768,0.0041964443193541635
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,2048,512,0.003547555456558863
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,2048,768,0.02127733329931895
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,2048,768,0.011360000405046674
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,2048,256,0.0034844444857703317
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,2048,512,0.011361777782440186
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,2048,512,0.02091644373204973
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,2048,128,0.0028613333900769553
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,2048,256,0.021934222843911912
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,2048,256,0.01034311122364468
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,2048,64,0.002895111011134254
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,2048,128,0.010729778144094678
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,2048,128,0.02129511038462321
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,2048,32,0.0028080000645584534
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,2048,64,0.01035377797153261
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,1536,65536,0.037441776858435735
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,2048,2560,0.023967110448413428
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,2048,32,0.010048000348938836
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,1536,51200,0.030631999174753826
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,2048,16384,0.049597332874933876
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,1536,65536,0.05710133579042223
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,1536,16384,0.013394667042626275
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,1536,51200,0.04719466633266873
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,1536,65536,0.12386222680409749
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,1536,12288,0.011576000187132092
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,1536,51200,0.10271733336978489
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,1536,16384,0.04934933450486925
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,1536,10240,0.010508444574144153
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,1536,12288,0.04366222355100843
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,1536,8192,0.010209778116808997
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,1536,10240,0.01941155559486813
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,1536,10240,0.0397093329164717
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,1536,7168,0.009534222384293875
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,1536,8192,0.017047999633683097
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,2048,3584,0.009008888569143083
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,1536,7168,0.016536000702116225
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,1536,6144,0.009039999710188972
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,1536,7168,0.033230221933788724
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,1536,5120,0.007762666377756331
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,1536,6144,0.015172445111804538
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,1536,5120,0.014783110883500842
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,1536,5120,0.028778665595584448
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,1536,4096,0.007304888632562425
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,1536,4096,0.013767999907334646
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,1536,16384,0.024894222617149353
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,1536,3584,0.007615110940403408
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,1536,4096,0.027279999521043565
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,1536,12288,0.02129511038462321
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,1536,3072,0.006237333433495627
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,1536,3584,0.026035555534892615
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,1536,3584,0.013086222112178802
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,1536,2560,0.005560889012283749
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,1536,3072,0.025069332785076563
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,1536,2048,0.006181333214044571
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,1536,2560,0.024121777878867254
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,1536,2560,0.01254488858911726
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,1536,1536,0.004922666483455234
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,1536,2048,0.022966222630606756
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,1536,2048,0.012440889245933957
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,1536,1024,0.004243555582231945
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,1536,1536,0.012078222301271228
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,1536,6144,0.03153689040078057
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,1536,1536,0.022292445103327434
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,1536,768,0.0038373333712418876
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,1536,1024,0.021593777669800654
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,1536,1024,0.011395555403497485
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,1536,512,0.0034959999223550162
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,1536,768,0.02272266646226247
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,1536,768,0.01108000013563368
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,1536,256,0.003160888950030009
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,1536,512,0.0206977774699529
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,1536,512,0.01074399964676963
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,1536,128,0.0028195555011431375
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,1536,256,0.021635555558734473
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,1536,256,0.0107351111041175
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,1536,64,0.0028942223224374983
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,1536,32,0.0025617778301239014
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,1536,128,0.011039111349317761
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,1024,65536,0.02639466689692603
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,1536,64,0.009823111196359
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,1536,32,0.00945955514907837
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,1024,51200,0.02218577762444814
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,1024,65536,0.0547599991162618
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,1024,65536,0.12360178099738227
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,1536,3072,0.013225778109497495
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,1024,16384,0.015066666735543145
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,1024,51200,0.044544888867272266
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,1536,8192,0.0352497763103909
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,1024,12288,0.012514666550689273
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,1024,51200,0.10150933265686035
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,1024,10240,0.011295110815101199
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,1024,16384,0.04924266537030538
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,1024,16384,0.02363377809524536
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,1024,12288,0.019693333241674636
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,1024,8192,0.010547555155224271
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,1024,12288,0.04311022162437439
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,1024,7168,0.010025777750545079
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,1024,10240,0.03865689039230347
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,1024,10240,0.01757066614098019
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,1024,8192,0.03372622198528714
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,1024,6144,0.008350222474998897
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,1024,8192,0.016480889585283067
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,1024,7168,0.01590044465329912
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,1024,7168,0.03225333491961161
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,1024,6144,0.030414223670959473
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,1024,6144,0.015091554986106025
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,1024,4096,0.007319110963079665
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,1024,5120,0.02847555610868666
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,1024,5120,0.014801777071423002
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,1024,3584,0.00685066646999783
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,1024,4096,0.027132444911532935
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,1024,4096,0.013452444639470843
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,1024,3072,0.0063075555695427795
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,1536,128,0.02028888960679372
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,1024,3584,0.02605688903066847
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,1024,2560,0.00590844452381134
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,1024,3072,0.01311288856797748
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,1024,2048,0.006577777779764599
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,1024,2560,0.012422222230169507
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,1024,2048,0.012073777616024017
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,1024,2048,0.022953778505325317
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,1024,1536,0.005578666511509154
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,1024,1536,0.011759111450778114
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,1024,1024,0.0052435555391841466
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,1024,1024,0.011387555963463254
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,1024,5120,0.008271111382378472
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,1024,1024,0.021271111236678228
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,1024,768,0.011076444553004371
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,1024,3584,0.01391377713945177
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,1024,768,0.02127733329931895
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,1024,512,0.003535110917356279
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,1024,3072,0.02502577834659153
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,1024,256,0.0032231110251612137
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,1024,2560,0.0240000006225374
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,1024,512,0.010767999622556897
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,1024,128,0.0028328889360030494
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,1024,256,0.010407999985747868
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,1024,256,0.020246222615242004
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,1024,64,0.0028159999185138275
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,1024,128,0.010728889041476779
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,1024,128,0.02029600077205234
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,1024,1536,0.022109333011839125
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,1024,32,0.0028239999794297745
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,768,65536,0.021613332960340712
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,1024,64,0.009443555441167619
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,1024,32,0.008971555365456475
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,768,51200,0.018220444520314533
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,768,65536,0.05288444293869866
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,768,65536,0.12309955226050483
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,1024,768,0.004204444587230682
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,768,16384,0.010393777655230628
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,768,51200,0.04368088973893059
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,768,12288,0.010995555255148145
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,768,16384,0.04847022228770786
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,768,16384,0.022015111313925848
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,768,10240,0.00963288876745436
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,768,12288,0.018541332748201158
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,768,12288,0.04151555564668443
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,768,8192,0.008984888593355814
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,768,10240,0.01756088932355245
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,768,10240,0.03743911120626662
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,768,7168,0.00832711077398724
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,1024,512,0.022311111291249592
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,768,8192,0.016134222348531086
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,768,8192,0.03413688805368211
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,768,6144,0.008292444050312042
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,768,7168,0.015465777781274585
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,768,7168,0.03293244375122918
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,768,5120,0.0069653333889113525
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,768,6144,0.02978044417169359
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,768,4096,0.007360888852013483
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,768,5120,0.028488000233968098
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,768,5120,0.014800889624489678
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,768,3584,0.00699733363257514
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,768,4096,0.026675555441114638
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,768,4096,0.013471110827393003
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,768,3072,0.006619555668698416
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,768,3584,0.013822221921549903
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,768,2560,0.006640888750553131
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,768,3072,0.013077333569526672
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,768,51200,0.10111466381284927
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,768,2560,0.013091555900043912
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,768,2560,0.0239982224173016
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,768,2048,0.0052373334765434265
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,768,1536,0.004923555586073133
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,768,2048,0.02297244469324748
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,768,2048,0.012738666600651212
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,768,1024,0.0041955556306574075
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,768,1536,0.012063999970753988
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,768,1536,0.02195555633968777
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,768,768,0.003847111016511917
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,768,1024,0.012056888805495368
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,768,1024,0.021969777014520433
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,768,512,0.003495111233658261
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,768,768,0.011052444577217102
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,768,768,0.02218755582968394
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,768,256,0.0031591111587153543
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,768,512,0.010678222609890832
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,768,6144,0.014829332629839579
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,768,512,0.020936000678274367
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,768,128,0.00282577777074443
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,768,256,0.020602666669421725
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,768,64,0.002532444480392668
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,768,128,0.02091644373204973
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,768,128,0.010690666735172272
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,768,32,0.0025271111064487034
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,512,65536,0.01755555636352963
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,768,3584,0.027416000763575237
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,768,64,0.010013333625263637
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,768,32,0.008647999829716152
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,768,3072,0.024205333656734888
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,512,65536,0.05208888981077406
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,512,65536,0.12347022692362468
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,512,16384,0.011021333436171213
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,512,51200,0.04339111182424757
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,512,51200,0.10127022531297471
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,512,12288,0.008979555633332994
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,512,16384,0.04791288905673557
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,512,16384,0.02163022259871165
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,512,10240,0.008062221937709385
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,512,12288,0.040227555566363864
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,512,12288,0.01835644410716163
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,512,8192,0.008285333712895712
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,512,10240,0.01759733259677887
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,512,7168,0.007999999655617608
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,512,8192,0.03333066569434272
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,512,7168,0.0318577786286672
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,512,7168,0.015837333268589444
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,512,6144,0.007262222468852997
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,512,6144,0.02980355421702067
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,768,256,0.01127822200457255
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,512,5120,0.00664533343580034
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,512,5120,0.0147724449634552
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,512,5120,0.028498666154013738
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,512,4096,0.0070879997478591064
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,512,51200,0.014818666709793938
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,512,3584,0.006986666884687211
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,512,4096,0.013435555828942193
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,512,4096,0.027464888162083093
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,512,3584,0.013078221844302284
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,512,3584,0.026039999392297532
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,512,3072,0.006579555571079254
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,512,3072,0.012729778057999082
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,512,2560,0.006249777972698212
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,512,10240,0.037301331758499146
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,512,8192,0.01591199967596266
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,512,2048,0.005897777775923411
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,512,2560,0.012039999994966718
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,512,2560,0.024380443824662104
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,512,1536,0.004534222185611725
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,512,2048,0.012050666742854647
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,512,2048,0.022673777408070032
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,512,1024,0.003842666745185852
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,512,1536,0.011747555600272285
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,512,6144,0.015275556180212231
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,512,1536,0.021987555755509272
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,512,768,0.003583999971548716
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,512,1024,0.011385777758227454
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,512,1024,0.021945777866575453
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,512,512,0.003212444484233856
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,512,768,0.022683555881182354
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,512,768,0.01074577785200543
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,512,256,0.002854222224818336
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,512,512,0.010400888820489248
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,512,512,0.020977778567208186
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,512,128,0.0028595555987623003
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,512,256,0.010434666441546546
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,512,256,0.02168088820245531
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,512,64,0.002520888836847411
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,512,32,0.002520888836847411
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,512,128,0.010390222072601318
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,512,128,0.020908445119857788
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,256,65536,0.015095111396577625
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,512,64,0.010371555884679159
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,256,51200,0.013463111387358772
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,512,32,0.008789333204428354
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,512,3072,0.025192888246642217
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,256,16384,0.008635555704434713
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,256,65536,0.12160533004336888
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,256,51200,0.04159466756714715
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,256,51200,0.10019289122687446
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,256,12288,0.00832711077398724
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,256,16384,0.047044446070988975
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,256,10240,0.007663999994595845
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,256,12288,0.04164800047874451
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,256,10240,0.01716800034046173
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,256,10240,0.03852622376547919
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,256,8192,0.0069191112286514705
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,256,8192,0.03310133351220025
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,256,8192,0.016501333978441026
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,256,7168,0.006681777950790193
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,256,6144,0.006523555351628198
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,256,7168,0.03161244591077169
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,256,7168,0.015825778245925903
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,256,5120,0.005992888990375731
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,256,6144,0.01514933341079288
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,256,6144,0.030136889881557886
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,256,4096,0.005607999861240387
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,256,5120,0.014827556080288358
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,256,5120,0.03013955553372701
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,256,3584,0.006265777680608962
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,256,65536,0.05033333433998955
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,256,4096,0.013409777647919126
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,256,4096,0.027814222706688776
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,256,3072,0.005599110904667113
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,256,3584,0.026159110996458266
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,256,3584,0.013455111119482251
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,256,2560,0.006232000059551663
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,256,16384,0.02075199948416816
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,256,3072,0.024341333243581984
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,256,2048,0.00590844452381134
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,256,12288,0.018235555953449674
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,256,2560,0.012780444489585029
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,256,2560,0.024115555816226538
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,256,1536,0.004230222354332606
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,256,2048,0.012048000262843238
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,256,1024,0.003879111260175705
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,256,2048,0.02336799932850732
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,256,768,0.0035208890007601846
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,256,1536,0.023000889354281958
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,256,1536,0.01237422227859497
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,256,1024,0.011045333411958484
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,256,512,0.0032115555885765287
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,256,768,0.011023999916182624
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,256,768,0.02160177793767717
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,256,256,0.0028293333533737394
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,256,512,0.02198933396074507
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,256,512,0.010686222049925061
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,256,128,0.0028106667515304354
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,256,256,0.020625778370433383
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,256,256,0.010386666489972008
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,256,64,0.0028151110228565005
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,256,32,0.002512000087234709
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,256,128,0.02158311174975501
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,256,128,0.010325333310498131
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,128,65536,0.014306666122542487
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,256,64,0.0103502223889033
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,128,51200,0.01273155543539259
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,256,32,0.009323555562231276
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,128,65536,0.0482666658030616
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,128,65536,0.12142844994862874
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,128,16384,0.00794044468137953
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,128,51200,0.040038221412234835
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,128,51200,0.09916533364189996
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,128,12288,0.0069422221018208405
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,128,16384,0.046853333711624146
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,128,16384,0.020733333296246
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,128,10240,0.006978666616810693
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,128,12288,0.018225777480337355
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,128,12288,0.040392001469930015
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,128,8192,0.006281777802440856
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,128,10240,0.017512889371977914
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,128,10240,0.03731022278467814
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,256,1024,0.021597334080272253
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,128,7168,0.006227555374304454
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,128,8192,0.015801777442296345
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,128,6144,0.005893333504597346
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,128,7168,0.03189511100451151
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,128,7168,0.015274667077594332
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,128,5120,0.005736888696750005
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,128,6144,0.01477777792347802
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,128,6144,0.02978488802909851
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,128,4096,0.005590222362014983
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,128,5120,0.014447111222479077
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,128,5120,0.028777778148651123
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,128,3584,0.005938666562239329
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,128,4096,0.013094222380055321
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,128,4096,0.02626488937271966
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,128,3072,0.0059279998143513995
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,128,3584,0.012837332983811697
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,128,3584,0.02585244509908888
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,128,2560,0.005610666755172942
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,128,3072,0.01273333364062839
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,128,3072,0.025032000409232244
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,256,3072,0.013420444395807056
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,128,2048,0.005544888890451855
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,128,2560,0.012039999994966718
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,128,2560,0.023644444015291
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,128,1536,0.0042275554604000514
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,128,2048,0.023385778069496155
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,128,2048,0.012599999705950419
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,128,1024,0.0038622220357259116
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,128,1536,0.021968000464969214
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,128,1536,0.011712888876597086
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,128,768,0.003544888976547453
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,128,1024,0.0217884447839525
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,128,1024,0.012087999946541257
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,128,8192,0.034612443712022566
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,128,768,0.02111377815405528
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,128,768,0.0107360002067354
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,128,256,0.0028133332315418455
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,128,512,0.022293332550260756
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,128,512,0.011412444214026133
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,128,128,0.0025333333760499954
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,128,256,0.010672888822025724
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,128,256,0.01994044416480594
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,128,64,0.002834666727317704
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,128,32,0.002502222235004107
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8_block,4,128,128,0.018938667244381376
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,128,128,0.011693333586057028
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,64,51200,0.009695111049546136
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,128,32,0.00868888861603207
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,128,64,0.009648888475365108
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,64,16384,0.0069573331210348345
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,64,65536,0.04896444413397047
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,64,51200,0.04038577940728929
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,64,16384,0.020578665865792167
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,64,10240,0.005932444499598608
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,64,8192,0.006615110983451207
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,64,12288,0.018616000811258953
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,64,7168,0.006604444649484422
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,64,10240,0.01685333251953125
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,64,6144,0.005959110955397288
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,64,8192,0.015846222639083862
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,64,5120,0.005948444621430502
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,64,7168,0.015489778584904142
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,64,4096,0.005572444448868434
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,64,6144,0.014495111174053617
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,64,3584,0.005617777920431561
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,64,5120,0.01443822185198466
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,64,3072,0.005895111295912001
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,64,4096,0.014135110709402295
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,128,512,0.003149333306484752
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,64,2560,0.005983110931184556
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,64,3584,0.013077333569526672
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,64,3072,0.013421333498424955
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,64,1536,0.004222222086456087
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,64,2560,0.012392000191741519
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,64,2048,0.012051555845472546
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,64,65536,0.010037333601050908
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,64,1536,0.01239733315176434
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,64,768,0.003510222252872255
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,64,1024,0.011078221930397881
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,64,512,0.002895999906791581
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,64,256,0.0028204443968004654
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,64,12288,0.005928888916969299
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,64,768,0.011785777906576792
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,64,128,0.0025191110455327565
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,64,64,0.0025271111064487034
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,64,256,0.00999644481473499
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,64,128,0.011409777734014722
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,64,32,0.0028151110228565005
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,64,64,0.009993777506881291
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,32,65536,0.008720888859695857
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,64,32,0.00997866690158844
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,32,51200,0.00832444429397583
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,32,65536,0.04788088798522949
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,32,16384,0.005902222047249476
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,32,51200,0.04038577940728929
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,32,12288,0.006224000205596288
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,64,2048,0.00562755556570159
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,32,10240,0.006263999889294307
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,32,16384,0.020302222834693063
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,32,8192,0.005346666607591841
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,32,12288,0.018519111805491976
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,64,1024,0.0038248888320393036
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,32,10240,0.017642666896184284
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,32,6144,0.005598222215970357
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,32,8192,0.01551555593808492
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,32,5120,0.005571555760171678
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,32,7168,0.015164444843928019
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,32,4096,0.005224888937340842
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,32,6144,0.015187554889255099
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,32,3584,0.005902222047249476
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,32,5120,0.013776000175211163
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,64,512,0.010724444356229572
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,32,3072,0.0052684446175893145
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,32,4096,0.013082666529549493
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,32,2560,0.00555288874440723
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,32,2048,0.005573333137565189
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,32,3584,0.013796444568369122
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,32,3072,0.012737777498033313
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,32,1536,0.004276444514592488
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,32,2560,0.012227555943859948
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,32,1024,0.003866666720973121
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,32,768,0.0033573332346147964
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,32,2048,0.011697777443461947
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,32,512,0.0031582222630580268
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,32,1536,0.011707555916574268
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,32,1024,0.011038222246699862
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,32,256,0.002536888958679305
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,32,128,0.0027057776848475137
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,32,512,0.010070222119490305
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,32,64,0.002524444419476721
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,32,128,0.010392000277837118
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,32,32,0.002537777854336633
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,32,64,0.00999022192425198
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,4,32,7168,0.006385777973466449
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,32,32,0.008628444539176093
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,65536,16384,0.3358737892574734
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,65536,16384,0.25782932175530326
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,65536,12288,0.25802577866448295
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,65536,51200,0.49355464511447483
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,65536,10240,0.2177120049794515
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,65536,12288,0.18417155742645264
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,32,768,0.011383111278216044
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,65536,8192,0.17615911695692274
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,65536,10240,0.13919377326965332
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,4,32,256,0.010348444183667501
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,65536,7168,0.1467404497994317
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,65536,6144,0.1283982197443644
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,65536,7168,0.10408000151316325
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,65536,5120,0.10912888579898411
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,65536,6144,0.09821155336168076
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,65536,4096,0.09108622206581964
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,65536,5120,0.08321244186825223
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,65536,3584,0.07300177547666761
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,65536,4096,0.0699839989344279
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,65536,3584,0.062936888800727
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,65536,3072,0.06233955754174126
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,65536,2560,0.053451554642783276
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,65536,1536,0.033936000532574125
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,65536,2048,0.043374223841561206
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,65536,3072,0.05404444535573324
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,65536,1024,0.024029332730505202
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,65536,2048,0.04378488990995619
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,65536,768,0.018920888503392536
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,65536,1024,0.026378666361172993
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,65536,1536,0.03404533200793796
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,65536,768,0.02331200076474084
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,65536,256,0.008630221916569604
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,65536,128,0.0063973334100511335
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,65536,512,0.01925511161486308
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,65536,64,0.005621333503060871
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,65536,128,0.01402933398882548
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,65536,32,0.005894222193294101
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,65536,51200,1.0088755289713542
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,65536,256,0.016410667035314772
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,65536,32,0.013247110777431063
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,65536,8192,0.12192532751295303
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,65536,2560,0.05109955535994636
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,51200,65536,0.5219857957628038
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,51200,51200,0.39698221948411727
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,65536,512,0.013734222286277346
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,51200,51200,0.7516355514526367
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,51200,12288,0.19202310509151885
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,51200,16384,0.17734755410088432
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,51200,12288,0.1317546632554796
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,51200,10240,0.1606408887439304
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,51200,8192,0.13228889306386313
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,65536,64,0.01277599980433782
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,51200,10240,0.10963910818099976
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,51200,7168,0.1160000032848782
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,51200,6144,0.10043022367689346
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,51200,8192,0.12698045041826037
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,51200,7168,0.08507555723190308
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,51200,5120,0.08916266759236653
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,51200,4096,0.07298222515318128
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,51200,5120,0.08155822091632418
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,51200,3584,0.06309688753551908
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,51200,3072,0.05628799729877048
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,51200,3584,0.05351288782225715
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,51200,2560,0.046394666035970054
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,51200,4096,0.06563466787338257
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,51200,3072,0.04491644435458713
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,51200,2048,0.03769866625467936
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,51200,16384,0.24975289238823783
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,51200,65536,0.9683538013034396
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,51200,1536,0.02937777837117513
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,51200,1024,0.021253334151373968
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,51200,768,0.015787555111779105
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,51200,1024,0.02397955622937944
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,51200,1536,0.02870222263866001
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,51200,512,0.011400000088744693
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,51200,256,0.007238222493065729
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,51200,256,0.014502222339312235
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,51200,128,0.0038337777886125776
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,51200,6144,0.07750578059090509
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,51200,64,0.0032195556494924757
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,51200,768,0.021470222208235
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,51200,128,0.012849777936935425
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,51200,32,0.0034871109657817413
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,51200,64,0.012406222522258759
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,51200,32,0.012381333443853589
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,16384,65536,0.3202604452768962
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,16384,65536,0.17825778325398764
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,16384,51200,0.24887556499905059
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,51200,2560,0.04656711220741272
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,16384,16384,0.08576355377833049
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,51200,2048,0.03783999880154928
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,16384,12288,0.06618311007817586
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,16384,10240,0.056906667020585805
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,16384,16384,0.08397599723603989
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,16384,8192,0.04465599854787191
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,51200,512,0.0184879998366038
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,16384,51200,0.13871288299560547
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,16384,7168,0.037648889753553606
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,16384,10240,0.05312088794178433
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,16384,6144,0.03284622232119242
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,16384,7168,0.039084444443384804
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,16384,5120,0.0281368891398112
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,16384,4096,0.023704888092146978
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,16384,12288,0.05680177609125773
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,16384,3584,0.020602666669421725
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,16384,6144,0.03509333398607042
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,16384,5120,0.03326755430963304
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,16384,3072,0.01827911039193471
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,16384,4096,0.02764355474048191
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,16384,2560,0.015876443849669564
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,16384,2048,0.013321778012646569
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,16384,3584,0.025714667307005987
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,16384,1536,0.010785777535703448
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,16384,3072,0.022797332869635686
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,16384,2560,0.022469333476490442
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,16384,1024,0.008283555507659912
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,16384,768,0.006908444480763541
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,16384,2048,0.020812445216708712
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,16384,512,0.004782222211360931
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,16384,1536,0.017845332622528076
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,16384,256,0.0035457776652442086
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,16384,128,0.0031662223239739737
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,16384,768,0.013821333646774292
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,16384,512,0.013781333135233985
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,16384,64,0.0028168888141711554
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,16384,32,0.0028320000403457214
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,16384,256,0.012717333104875354
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,16384,128,0.011048888994587792
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,16384,64,0.011049778097205691
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,16384,32,0.010050666828950247
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,12288,65536,0.24334398905436197
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,12288,16384,0.06645066870583428
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,12288,65536,0.15303288565741643
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,12288,51200,0.1885768837398953
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,12288,12288,0.051290667719311185
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,12288,10240,0.04388088981310526
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,12288,51200,0.11998311678568523
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,12288,8192,0.03852355480194092
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,12288,12288,0.050738665792677135
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,12288,16384,0.06531466378106011
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,12288,10240,0.04293244414859348
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,12288,8192,0.047057777643203735
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,12288,6144,0.0306915541489919
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,12288,7168,0.034536888202031456
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,12288,5120,0.026551999979548987
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,12288,4096,0.02332088847955068
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,12288,7168,0.03457333313094245
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,12288,6144,0.030569778548346624
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,12288,3072,0.017824000782436795
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,12288,4096,0.025942222939597234
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,12288,3584,0.024359110328886244
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,12288,2560,0.015862221519152325
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,12288,3072,0.020915556285116408
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,12288,2048,0.013748444616794586
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,16384,1024,0.015182221929232279
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,12288,1536,0.008848889006508721
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,12288,2560,0.021495110458797876
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,12288,1024,0.006952889263629913
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,12288,2048,0.019096000327004325
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,12288,768,0.00591555568906996
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,12288,1536,0.016601777738995023
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,12288,512,0.0036880001425743103
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,12288,1024,0.014165333575672574
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,12288,256,0.0031555555760860443
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,12288,768,0.013100444442696042
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,12288,128,0.0028195555011431375
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,12288,512,0.01275288893116845
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,12288,64,0.00282577777074443
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,12288,256,0.011711999773979187
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,16384,8192,0.044236444764667086
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,12288,32,0.0028195555011431375
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,12288,128,0.010040889183680216
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,12288,64,0.010079111489984725
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,12288,32,0.010188444621033138
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,10240,65536,0.2048106723361545
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,10240,65536,0.1490808857811822
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,12288,3584,0.02036711076895396
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,10240,16384,0.05782666471269396
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,12288,5120,0.02914311157332526
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,10240,12288,0.04484088884459602
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,10240,51200,0.11547111140357123
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,10240,10240,0.03874489002757602
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,10240,8192,0.03230399886767069
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,10240,16384,0.05214488837454054
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,10240,10240,0.04228977693451775
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,10240,12288,0.04402222235997518
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,10240,7168,0.029366221692827012
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,10240,8192,0.03355377912521362
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,10240,6144,0.026584888497988384
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,10240,5120,0.022628444764349196
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,10240,4096,0.01927199959754944
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,10240,7168,0.029465778006447688
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,10240,3584,0.017921777235137094
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,10240,6144,0.02700977855258518
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,10240,3072,0.015754666593339708
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,10240,5120,0.025447110335032146
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,10240,4096,0.02398577829202016
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,10240,2560,0.014775110615624322
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,10240,2048,0.011024889018800525
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,10240,3584,0.021597334080272253
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,10240,1536,0.0090844440791342
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,10240,3072,0.018984888990720112
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,10240,1024,0.00656444455186526
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,10240,2560,0.019023999571800232
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,10240,768,0.004839999808205498
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,10240,2048,0.017975111802419026
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,10240,512,0.00351555562681622
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,10240,1536,0.015096889601813423
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,10240,256,0.003149333306484752
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,10240,128,0.0028640000770489373
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,10240,1024,0.013880000346236758
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,10240,768,0.013212444053755866
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,10240,64,0.002530666689078013
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,10240,512,0.01314399970902337
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,10240,32,0.0028133332315418455
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,10240,256,0.011367999845080905
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,10240,128,0.01074399964676963
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,10240,64,0.011072888970375061
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,10240,32,0.010194666683673859
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,8192,65536,0.1726764440536499
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,10240,51200,0.16016356150309244
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,8192,16384,0.04653777678807577
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,8192,51200,0.12782843907674155
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,8192,12288,0.03459022111362881
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,8192,10240,0.027622222900390625
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,8192,51200,0.07734222544564141
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,8192,8192,0.023741333021057978
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,8192,12288,0.036772443188561335
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,8192,16384,0.04806133442454868
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,8192,7168,0.020954666866196528
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,8192,6144,0.018960888187090557
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,8192,8192,0.027276444766256545
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,8192,10240,0.031353778309292264
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,8192,5120,0.016349333855840895
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,8192,4096,0.013906665974193148
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,8192,7168,0.02516888909869724
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,8192,3584,0.011861333416567909
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,8192,6144,0.022671999202834234
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,8192,5120,0.021976888179779053
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,8192,4096,0.02051111062367757
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,8192,2560,0.009649777577983009
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,8192,3584,0.019454222586419847
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,8192,2048,0.008271999657154083
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,8192,3072,0.01719111038578881
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,8192,1536,0.007191999918884701
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,8192,2560,0.01735555628935496
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,8192,1024,0.005528000079923206
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,8192,2048,0.016171556380059984
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,8192,768,0.0041724443435668945
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,8192,512,0.0035582222044467926
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,8192,1536,0.013429332938459186
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,8192,1024,0.013083555632167392
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,8192,256,0.0029893333299292457
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,8192,512,0.011408000356621213
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,8192,128,0.0028497777465316984
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,8192,256,0.011720889144473605
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,8192,64,0.0025333333760499954
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,8192,65536,0.09728266795476277
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,8192,128,0.010412444670995077
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,8192,32,0.002543111021320025
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,8192,64,0.01034311122364468
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,8192,32,0.009429333110650381
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,7168,65536,0.146342224544949
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,7168,51200,0.11644711759355332
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,8192,3072,0.010847999817795224
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,7168,16384,0.042451557185914784
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,7168,51200,0.0704524450831943
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,7168,12288,0.03346755438380771
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,7168,16384,0.040347556273142494
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,7168,10240,0.02843466732237074
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,7168,12288,0.034895999564064875
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,7168,8192,0.025063110722435847
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,7168,10240,0.029678222205903795
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,7168,7168,0.01872977779971229
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,7168,8192,0.026752889156341553
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,8192,768,0.012798222402731577
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,7168,6144,0.01680444512102339
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,7168,5120,0.014519999424616495
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,7168,4096,0.013096888860066732
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,7168,3584,0.011352000137170156
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,7168,7168,0.023548444112141926
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,7168,6144,0.023211555348502264
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,7168,5120,0.021516443954573736
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,7168,4096,0.01873333255449931
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,7168,2560,0.008989333278603023
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,7168,2048,0.007628444168302748
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,7168,3584,0.018546667363908555
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,7168,3072,0.01682222220632765
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,7168,1536,0.006908444480763541
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,7168,1024,0.0047066667013698155
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,7168,2048,0.01571822166442871
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,7168,768,0.0038533334930737815
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,7168,1536,0.013423999978436364
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,7168,1024,0.012464000119103326
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,7168,65536,0.09009510940975612
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,7168,768,0.012799999780125089
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,7168,256,0.0032053333189752367
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,7168,128,0.0028444443725877335
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,7168,512,0.011369778050316704
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,7168,64,0.0028168888141711554
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,7168,256,0.011746666497654386
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,7168,128,0.01036088913679123
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,7168,32,0.002854222224818336
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,7168,64,0.01017155581050449
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,6144,65536,0.12528888384501138
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,7168,32,0.009368889033794403
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,6144,65536,0.08444711234834458
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,6144,51200,0.09816266430748834
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,6144,16384,0.037767112255096436
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,6144,12288,0.02981511089536879
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,7168,3072,0.010263111028406356
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,6144,10240,0.025747555825445387
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,6144,16384,0.03778577844301859
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,6144,8192,0.0221377776728736
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,7168,2560,0.016747555798954435
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,6144,12288,0.031005332867304485
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,6144,7168,0.0199991116921107
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,6144,10240,0.027279110418425664
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,6144,6144,0.01797422269980113
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,6144,8192,0.025643555654419795
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,6144,5120,0.01575999955336253
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,7168,512,0.0034977777136696708
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,6144,7168,0.02274399995803833
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,6144,4096,0.011847111086050669
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,6144,3584,0.010173333187898
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,6144,6144,0.021661332911915247
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,6144,3072,0.009240888886981541
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,6144,5120,0.020668443706300523
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,6144,2560,0.008525333470768398
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,6144,4096,0.01887999971707662
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,6144,3584,0.017824888229370117
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,6144,3072,0.01612977849112617
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,6144,1536,0.006153777655627992
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,6144,2560,0.016515556308958266
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,6144,1024,0.0041706665522522396
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,6144,2048,0.014498665928840637
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,6144,768,0.00350222239891688
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,6144,1536,0.013088000317414602
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,6144,512,0.0034906665484110513
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,6144,256,0.003167111012670729
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,6144,1024,0.012410666379663678
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,6144,768,0.011383111278216044
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,6144,512,0.011760888828171624
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,6144,64,0.0028204443968004654
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,6144,51200,0.06471200121773614
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,6144,32,0.0028284444577164124
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,6144,128,0.01070755554570092
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,6144,64,0.009648888475365108
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,5120,65536,0.10674044158723618
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,6144,32,0.009314667019579146
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,5120,51200,0.08461688624487983
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,5120,65536,0.07571999894248115
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,5120,16384,0.0328800015979343
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,5120,51200,0.059122668372260205
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,5120,12288,0.026322666141721938
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,5120,16384,0.036976890431510076
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,6144,2048,0.007476444045702617
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,5120,10240,0.023128888673252527
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,5120,8192,0.019885333047972787
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,5120,12288,0.02998044424586826
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,5120,10240,0.02677333354949951
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,5120,7168,0.017885333961910672
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,5120,6144,0.01625333395269182
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,5120,8192,0.024915556112925213
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,6144,128,0.002846222163902389
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,5120,6144,0.021311110920376245
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,6144,256,0.010994666980372535
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,5120,4096,0.011022222538789114
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,5120,3584,0.009687999884287516
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,5120,5120,0.01998488936159346
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,5120,3072,0.008633777499198914
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,5120,4096,0.01793333391348521
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,5120,3584,0.017895110779338412
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,5120,3072,0.015807999504937064
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,5120,2048,0.006949333681000604
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,5120,2560,0.01514844430817498
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,5120,1536,0.005260444349712796
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,5120,2048,0.014440000057220459
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,5120,1024,0.0038604442444112566
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,5120,1536,0.013069333301650153
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,5120,768,0.0038382220599386427
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,5120,1024,0.012446222205956778
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,5120,512,0.0035502223504914176
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,5120,768,0.011388444238238864
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,5120,256,0.0028897778441508612
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,5120,128,0.0028577778074476454
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,5120,512,0.012412444584899478
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,5120,64,0.0028453332682450614
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,5120,256,0.011426666544543372
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,5120,32,0.0025235555238193935
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,5120,7168,0.02231377859910329
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,5120,128,0.010688888529936472
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,5120,64,0.010394666757848527
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,4096,65536,0.09054844246970283
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,4096,51200,0.06990666521920098
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,4096,65536,0.06941511233647664
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,4096,16384,0.027662222584088642
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,5120,2560,0.007699555820888943
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,4096,12288,0.021169778373506334
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,4096,51200,0.054583999845716685
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,4096,10240,0.01868088874551985
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,4096,16384,0.03171199891302321
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,4096,8192,0.01706755492422316
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,4096,7168,0.014747555057207743
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,4096,12288,0.0288080010149214
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,4096,6144,0.013256000147925483
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,4096,10240,0.02535466684235467
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,4096,5120,0.011870221959220039
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,4096,7168,0.021474666065639917
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,4096,4096,0.011036444041464063
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,4096,5120,0.019343111250135634
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,4096,3584,0.011343999869293638
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,4096,4096,0.01752800080511305
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,4096,3072,0.01035733355416192
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,4096,3584,0.016417778200573392
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,4096,2560,0.009071110851234859
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,4096,3072,0.014840889308187695
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,4096,2048,0.007859555383523306
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,4096,2560,0.014789332946141561
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,4096,1536,0.006238222122192383
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,5120,32,0.009672889278994666
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,4096,2048,0.014119999276267158
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,4096,1024,0.004928888960017098
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,4096,768,0.004571555389298333
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,4096,1536,0.012738666600651212
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,4096,512,0.003846222327815162
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,4096,1024,0.01221866657336553
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,4096,256,0.003192000091075897
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,4096,768,0.011393778026103973
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,4096,128,0.0028355556229750314
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,4096,512,0.011034666664070554
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,4096,64,0.002817777709828483
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,4096,256,0.011781333221329583
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,4096,32,0.0028577778074476454
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,4096,8192,0.02501511077086131
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,4096,64,0.010016889207892949
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,4096,6144,0.019923556182119582
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,3584,65536,0.07921510934829712
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,4096,32,0.009701333112186855
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,3584,51200,0.06301510996288724
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,3584,16384,0.025322667426533167
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,3584,12288,0.019932443896929424
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,3584,65536,0.0654017792807685
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,3584,10240,0.017322666115230985
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,3584,16384,0.03136444422933791
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,3584,8192,0.01514488955338796
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,3584,12288,0.02786933382352193
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,3584,7168,0.014085332552591959
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,5120,5120,0.014289778139856128
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,3584,10240,0.024061333802011278
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,3584,8192,0.02199466692076789
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,3584,6144,0.012787555654843649
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,3584,5120,0.011365333365069495
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,3584,6144,0.01904088921017117
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,3584,4096,0.010483555495738983
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,3584,5120,0.01795022189617157
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,3584,3584,0.010348444183667501
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,3584,4096,0.015812445018026564
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,3584,3072,0.009560888840092553
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,3584,3584,0.01460088955031501
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,3584,2560,0.008271111382378472
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,4096,128,0.010688888529936472
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,3584,3072,0.013470222552617392
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,3584,2048,0.007256888680987888
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,3584,1536,0.006236444330877728
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,3584,2560,0.014104000396198697
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,3584,1024,0.0046942221621672315
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,3584,2048,0.013059555656380124
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,3584,1536,0.0127368892232577
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,3584,768,0.0041751112374994485
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,3584,512,0.0038284444146686127
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,3584,1024,0.011718221836619906
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,3584,51200,0.052928000688552856
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,3584,256,0.002875555513633622
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,3584,768,0.011678222152921887
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,3584,128,0.0028168888141711554
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,3584,512,0.011081777513027191
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,3584,64,0.002536000063021978
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,3584,32,0.00282577777074443
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,3584,256,0.011419555379284753
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,3584,128,0.010013333625263637
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,3072,65536,0.06775999731487699
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,3584,64,0.01035911093155543
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,3584,7168,0.020918221937285528
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,3584,32,0.008980444735950893
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,3072,16384,0.02156977852185567
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,3072,51200,0.05413866705364651
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,3072,12288,0.01792533364560869
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,3072,65536,0.06339999702241686
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,3072,10240,0.016163556112183463
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,3072,51200,0.051177776522106595
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,3072,16384,0.030233777231640283
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,3072,7168,0.01278222186697854
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,3072,12288,0.02602844436963399
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,3072,10240,0.023264888260099623
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,3072,8192,0.02200711104604933
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,3072,5120,0.011030221978823343
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,3072,7168,0.019523556033770244
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,3072,4096,0.009328000247478485
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,3072,6144,0.018834667073355783
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,3072,3584,0.00923733330435223
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,3072,5120,0.017673777209387887
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,3072,3072,0.008912000391218398
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,3072,4096,0.015291555060280694
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,3072,2560,0.008310221963458592
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,3072,2048,0.006558222075303395
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,3072,3072,0.01370666672786077
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,3072,2560,0.013767999907334646
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,3072,1536,0.007315555380450354
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,3072,1024,0.005046222358942032
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,3072,2048,0.01313777764638265
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,3072,768,0.004577777865860197
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,3072,1536,0.012221333053376941
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,3072,512,0.0042035554846127825
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,3072,768,0.011751111182901593
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,3072,256,0.0035084444615576
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,3072,512,0.011398221883508893
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,3072,128,0.003220444545149803
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,3072,256,0.011767999993430244
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,3072,8192,0.01350844403107961
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,3072,64,0.0028088889602157804
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,3072,128,0.009988444546858469
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,3072,32,0.002530666689078013
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,3072,6144,0.011725333001878528
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,2560,65536,0.05885689126120674
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,3072,64,0.01036177741156684
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,3072,32,0.008750222623348236
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,2560,51200,0.04675466815630595
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,2560,16384,0.01961599952644772
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,2560,65536,0.06065422296524048
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,2560,12288,0.015810666812790763
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,2560,51200,0.05003822180959913
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,2560,10240,0.013967111706733704
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,2560,16384,0.027796443965699937
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,2560,8192,0.01205244412024816
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,3072,3584,0.014441778262456259
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,2560,7168,0.011524444652928246
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,2560,10240,0.022982221510675218
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,2560,6144,0.01038755559258991
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,2560,5120,0.0099973330895106
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,2560,8192,0.020086222224765353
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,2560,4096,0.009008000294367472
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,2560,7168,0.018909333480728995
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,2560,3584,0.00850044439236323
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,2560,5120,0.015826667348543804
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,2560,3072,0.008051555189821456
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,2560,4096,0.01493866741657257
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,3072,1024,0.011408888631396823
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,2560,2560,0.006620444357395172
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,2560,3584,0.013798221945762634
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,2560,2048,0.005936000082227919
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,2560,3072,0.013345777988433838
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,2560,2560,0.013410666750537025
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,2560,1536,0.005937777873542573
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,2560,2048,0.01277599980433782
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,2560,1024,0.004870222260554631
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,2560,768,0.004187555362780889
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,2560,1536,0.01241422196229299
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,2560,1024,0.011420444481902652
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,2560,768,0.011741333537631564
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,2560,256,0.0031866667171319327
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,2560,512,0.011368888947698804
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,2560,128,0.0028151110228565005
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,2560,256,0.011705777711338468
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,2560,64,0.002530666689078013
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,2560,128,0.009732444253232744
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,2560,12288,0.024332443873087566
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,2560,32,0.00258577780591117
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,2560,64,0.0107342220014996
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,2048,65536,0.05097511079576281
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,2560,32,0.009319999979601966
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,2048,51200,0.040568000740475126
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,2560,6144,0.01753155555990007
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,2048,16384,0.015793777174419828
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,2048,65536,0.058780444992913135
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,2048,12288,0.013583111266295115
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,2048,51200,0.04840444525082906
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,2048,10240,0.011726222104496427
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,2048,16384,0.025567111041810777
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,2048,8192,0.011129777464601727
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,2048,12288,0.021568000316619873
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,2048,7168,0.010690666735172272
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,2048,10240,0.020399999287393358
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,2048,6144,0.009699555734793345
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,2048,8192,0.018776888648668926
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,2048,5120,0.009136888715955947
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,2048,4096,0.010183999935785929
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,2048,7168,0.01685688893000285
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,2048,3584,0.008996444443861643
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,2048,6144,0.015476443701320224
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,2560,512,0.0038533334930737815
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,2048,3072,0.006568000134494569
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,2048,2560,0.005702222386995952
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,2048,4096,0.014102222190962898
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,2048,2048,0.0069146665434042616
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,2048,3584,0.013691555294725629
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,2048,1536,0.005600000007285013
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,2048,3072,0.013101333545313941
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,2048,1024,0.004943111290534337
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,2048,2560,0.013087111214796701
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,2048,2048,0.012496000362767113
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,2048,1536,0.01274311128589842
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,2048,512,0.0038942222793896994
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,2048,1024,0.011397333608733283
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,2048,256,0.0035048888789282907
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,2048,768,0.011386666860845355
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,2048,128,0.0028417776856157514
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,2048,512,0.011397333608733283
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,2048,64,0.002524444419476721
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,2048,256,0.011376889215575324
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,2048,128,0.00999111102686988
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,2048,64,0.010677333507272931
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,2048,32,0.008663111262851292
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,1536,65536,0.03631555702951219
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,1536,51200,0.030825777186287776
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,1536,65536,0.05697866943147448
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,1536,16384,0.013779555757840475
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,1536,51200,0.04663377669122484
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,1536,12288,0.01142133358452055
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,2048,5120,0.014855111638704935
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,1536,10240,0.010312000082598792
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,1536,16384,0.024123556084103052
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,1536,12288,0.0214346663819419
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,1536,10240,0.02012266715367635
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,1536,7168,0.009693333672152625
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,2048,768,0.0041759999261962045
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,1536,8192,0.016864889197879367
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,1536,6144,0.009011555876996782
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,1536,5120,0.007695111135641734
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,1536,4096,0.0074720001882976955
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,1536,6144,0.01517955627706316
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,1536,5120,0.014799111419253878
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,1536,3584,0.006588444527652528
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,1536,4096,0.014132445057233175
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,1536,3584,0.01408622165520986
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,2048,32,0.00281866660548581
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,1536,2560,0.005939555664857228
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,1536,3072,0.013204444613721637
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,1536,2048,0.006231110956933763
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,1536,1536,0.005212444398138259
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,1536,2560,0.012786666552225748
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,1536,1024,0.004316444612211651
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,1536,1536,0.012788444757461548
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,1536,768,0.003839111162556542
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,1536,1024,0.011039999624093374
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,1536,512,0.00350577798154619
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,1536,768,0.012051555845472546
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,1536,256,0.0028728888266616394
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,1536,512,0.011039999624093374
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,1536,128,0.002847111059559716
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,1536,256,0.011436444189813403
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,1536,128,0.01039644413524204
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,1536,7168,0.016050666570663452
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,1536,64,0.0026942222482628296
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,1536,32,0.002536888958679305
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,1536,3072,0.0064035554726918536
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,1024,65536,0.026762665973769292
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,1536,32,0.009357333183288574
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,1024,51200,0.022281777527597215
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,1024,65536,0.054040888945261635
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,1024,16384,0.014092443717850579
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,1024,51200,0.04450666573312548
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,1536,2048,0.012653333445390066
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,1024,12288,0.012409778104888068
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,1024,10240,0.011367999845080905
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,1024,16384,0.022336888644430373
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,1024,12288,0.018648000227080453
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,1024,8192,0.010035555395815108
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,1024,7168,0.00943999985853831
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,1024,10240,0.017839999662505258
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,1024,6144,0.008588444855478074
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,1024,8192,0.016220443778567843
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,1536,8192,0.010212444596820408
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,1024,5120,0.007985778152942657
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,1024,7168,0.015517334143320719
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,1024,4096,0.0074142225914531285
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,1024,6144,0.015180443723996481
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,1024,3584,0.006959999601046245
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,1024,3072,0.00657066661450598
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,1024,5120,0.014476444986131458
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,1024,4096,0.013150222599506378
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,1024,2560,0.005910222315125995
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,1024,3584,0.013819555441538492
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,1024,2048,0.007603555917739868
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,1024,3072,0.013122667041089801
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,1024,1536,0.006623111251327727
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,1024,1024,0.004543999830881755
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,1024,2560,0.012961777547995249
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,1024,768,0.003910222401221593
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,1536,64,0.01036000003417333
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,1024,2048,0.012737777498033313
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,1024,512,0.003863999827040566
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,1024,1536,0.012523555921183692
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,1024,256,0.003169777699642711
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,1024,1024,0.011208000282446543
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,1024,128,0.0028595555987623003
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,1024,768,0.011013333168294696
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,1024,64,0.002556444456179937
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,1024,512,0.011754666765530905
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,1024,32,0.0028391112056043413
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,1024,256,0.011752000285519494
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,768,65536,0.022264000442292955
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,1024,128,0.009723555710580613
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,1024,64,0.010048000348938836
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,1024,32,0.009149333669079674
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,768,16384,0.010392000277837118
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,768,65536,0.0527724458111657
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,768,12288,0.010671111444632212
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,768,10240,0.009690666364298927
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,768,12288,0.018925334016482036
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,768,10240,0.017231111725171406
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,768,7168,0.008339555727110969
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,768,8192,0.016142222616407607
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,768,6144,0.008011555506123437
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,768,7168,0.0155102229780621
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,768,5120,0.006707555717892117
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,768,6144,0.014946666028764514
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,768,4096,0.007254222200976477
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,768,5120,0.014159111513031853
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,768,3584,0.006928000185224745
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,768,4096,0.013136000268989138
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,768,3072,0.006592000110281839
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,768,3584,0.013524444566832649
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,768,2560,0.006583111153708563
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,768,3072,0.01278133359220293
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,768,2048,0.005208888815508948
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,768,51200,0.018533334136009216
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,768,2560,0.01275111072593265
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,768,1536,0.004927999857399198
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,768,1024,0.0041706665522522396
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,768,2048,0.012413333687517377
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,768,51200,0.04368444283803304
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,768,768,0.003998222036494149
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,768,1536,0.01203555530971951
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,768,16384,0.021262221866183813
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,768,512,0.003504000190231535
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,768,256,0.0028942223224374983
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,768,8192,0.009346666435400644
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,768,1024,0.011752888560295105
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,768,64,0.002528000002106031
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,768,768,0.010838222172525195
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,768,512,0.01070844464831882
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,768,32,0.0024906665914588505
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,768,128,0.011043555206722684
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,512,65536,0.016806221670574613
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,512,51200,0.014775110615624322
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,768,64,0.010374222364690568
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,768,32,0.009301332963837517
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,512,16384,0.011031111081441244
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,512,12288,0.008651555412345463
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,512,65536,0.05209155546294319
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,512,51200,0.04349777764744229
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,512,16384,0.02058577703105079
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,512,12288,0.018560000591807894
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,512,8192,0.0083155557513237
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,512,10240,0.017180444465743173
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,512,7168,0.007623111208279927
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,512,8192,0.016247999336984422
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,512,6144,0.007304000357786815
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,512,7168,0.015462223026487561
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,512,5120,0.006973333656787872
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,512,6144,0.014833778142929077
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,512,4096,0.007304000357786815
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,512,5120,0.013816888961527081
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,512,3584,0.006918222126033571
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,768,128,0.002875555513633622
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,512,3072,0.0069324444565508105
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,512,3584,0.013072888884279462
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,512,2560,0.006260444306664997
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,512,3072,0.013402666482660504
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,512,2048,0.005943111247486538
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,512,1536,0.004353777815898259
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,512,2560,0.012444444828563266
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,512,1024,0.003891555385457145
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,512,2048,0.012747555143303342
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,512,10240,0.007611555357774098
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,512,768,0.003504000190231535
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,512,512,0.003175111073586676
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,512,1024,0.011365333365069495
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,512,256,0.0031395554542541504
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,512,768,0.01089422239197625
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,512,128,0.002604444407754474
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,512,512,0.011725333001878528
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,512,64,0.00281866660548581
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,512,256,0.01072533345884747
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,512,32,0.0028328889360030494
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,512,128,0.01035288886891471
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,256,65536,0.015465777781274585
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,512,32,0.00903200027015474
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,256,51200,0.013051555388503604
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,256,65536,0.04907555712593926
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,256,16384,0.008626666333940294
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,512,4096,0.013992889059914483
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,256,12288,0.00832266691658232
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,256,51200,0.04043289025624593
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,768,256,0.011024889018800525
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,256,10240,0.007609777980380588
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,256,16384,0.020632000433074105
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,256,12288,0.01852888862291972
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,256,7168,0.006792000184456508
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,256,10240,0.017198221551047433
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,256,8192,0.016022221909628976
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,256,6144,0.006252444452709622
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,256,5120,0.005964444329341252
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,256,7168,0.015772443678643968
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,512,1536,0.011730666789743634
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,256,4096,0.005663110978073544
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,256,6144,0.01484266585773892
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,256,3584,0.006284444282452266
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,256,5120,0.014119999276267158
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,256,3072,0.006048000107208888
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,256,2560,0.006600889066855113
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,256,4096,0.01312355531586541
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,256,3584,0.013403555585278405
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,256,2048,0.005906666732496685
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,256,3072,0.012744888663291931
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,256,1536,0.0041680000722408295
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,256,2560,0.013066666821638743
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,256,1024,0.0038373333712418876
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,256,768,0.003532444437344869
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,256,2048,0.012116444607575735
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,256,1536,0.011776888536082374
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,256,1024,0.01205244412024816
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,256,256,0.0028604444944196274
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,256,768,0.011051555474599203
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,256,128,0.002855111120475663
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,256,512,0.011364444262451597
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,256,64,0.00282222218811512
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,256,256,0.011712888876597086
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,256,32,0.002530666689078013
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,256,64,0.009328000247478485
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,256,8192,0.0069431112044387394
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,128,65536,0.013735999663670858
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,256,32,0.009694221946928237
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,128,65536,0.047954665289984814
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,128,51200,0.04034488730960422
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,128,16384,0.007613333563009898
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,128,12288,0.007282666862010956
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,128,16384,0.020961778031455144
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,128,12288,0.018211555149820115
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,128,10240,0.016951999730534024
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,128,8192,0.006579555571079254
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,512,64,0.010024000373151567
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,128,7168,0.006588444527652528
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,128,8192,0.015463999576038785
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,128,6144,0.0059368887709246735
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,128,7168,0.015490666031837463
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,128,5120,0.005897777775923411
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,256,128,0.009700444837411245
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,128,6144,0.014136888914638095
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,128,4096,0.005606222069925732
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,128,5120,0.014493332968817817
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,128,3584,0.005962666538026597
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,128,4096,0.013106666505336761
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,128,3072,0.005582222094138463
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,128,3584,0.013748444616794586
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,128,2560,0.00590844452381134
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,128,3072,0.012429333395428128
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,128,2048,0.00554933316177792
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,128,10240,0.0069520001610120135
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,128,2560,0.012924444344308643
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,128,1536,0.0041751112374994485
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,128,2048,0.011746666497654386
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,128,1024,0.00388355553150177
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,128,768,0.003478222423129611
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,128,1536,0.012449777788586087
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,128,1024,0.011021333436171213
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,128,512,0.0031431110368834603
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,256,512,0.0031617778456873367
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,128,768,0.011752000285519494
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,128,128,0.00282577777074443
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,128,512,0.011018666956159802
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,128,256,0.011040888726711273
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,128,64,0.002504000026318762
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,128,128,0.011043555206722684
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,128,32,0.002520888836847411
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,64,65536,0.010330666270520952
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,128,64,0.009999111294746399
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,128,32,0.009717333647939894
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,64,65536,0.04788622260093689
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,128,51200,0.0127368892232577
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,64,16384,0.0069546666410234236
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,64,12288,0.005927111125654644
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,64,51200,0.04015555646684434
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,64,10240,0.006265777680608962
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,64,16384,0.020271110865804885
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,64,8192,0.006628444625271692
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,64,7168,0.006559999866618051
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,64,10240,0.016823111308945548
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,64,6144,0.005599110904667113
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,64,8192,0.015810666812790763
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,64,5120,0.005277333160241445
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,64,6144,0.014156444205178155
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,64,4096,0.005583999885453119
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,64,5120,0.014099554883109199
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,64,3584,0.00556355549229516
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,128,256,0.0028284444577164124
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,64,4096,0.013067555924256643
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,64,3072,0.005902222047249476
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,64,2560,0.0059057776298787855
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,64,3072,0.012551111479600271
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,64,2048,0.005621333503060871
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,64,2560,0.012801777985360889
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,64,1536,0.0042408886882993905
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,64,51200,0.009663110805882348
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,64,1024,0.0035297779573334586
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,64,2048,0.01202133297920227
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,64,1536,0.0124177775449223
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,64,1024,0.011023110813564725
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,64,512,0.002874666617976295
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,64,768,0.011884444289737277
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,64,256,0.0028275555620590844
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,64,12288,0.018135999639829
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,64,128,0.002507555608948072
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,64,512,0.01068800025516086
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,64,64,0.0024746666765875286
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,64,256,0.01108977778090371
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,64,7168,0.015524443652894763
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,64,128,0.009705777797434065
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,64,32,0.00249777775671747
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,32,65536,0.009007111191749573
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,64,64,0.010009778042634329
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,32,51200,0.008275555239783393
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,64,32,0.009687110781669617
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,32,16384,0.006218666831652324
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,32,65536,0.04829244481192695
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,32,12288,0.006604444649484422
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,32,10240,0.005560889012283749
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,32,51200,0.040018667777379356
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,32,16384,0.02090666691462199
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,64,3584,0.012791111237472959
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,32,12288,0.018194667167133756
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,32,7168,0.005555555638339784
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,32,10240,0.017231111725171406
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,32,6144,0.005625777774386936
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,32,5120,0.0052266667286554975
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,32,8192,0.016136889656384785
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,32,4096,0.005927111125654644
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,32,7168,0.015112888481881885
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,32,3584,0.005872000008821487
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,32,6144,0.014848000473446317
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,32,3072,0.005571555760171678
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,32,5120,0.013815110756291283
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,32,2560,0.00554666668176651
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,32,4096,0.013784888717863293
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,64,768,0.0034959999223550162
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,32,2048,0.005919111271699269
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,32,1536,0.004507555729813046
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,32,3072,0.01314222233162986
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,32,1024,0.0038497779104444715
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,32,2560,0.012721777790122561
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,32,2048,0.011877333124478659
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,32,768,0.003176888864901331
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,32,1536,0.012466666599114736
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,32,512,0.0032177778581778207
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,32,1024,0.011077333655622272
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,32,256,0.0028204443968004654
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,32,768,0.010695111420419482
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,32,128,0.0025271111064487034
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,32,512,0.011400889191362592
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,32,64,0.002814222127199173
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,32,256,0.010755555497275459
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,32,32,0.002469333302643564
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,32,128,0.010688888529936472
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,32,64,0.010671999719407825
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,32,32,0.00833333366447025
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,3,32,8192,0.0052728888889153796
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,65536,16384,0.19247289498647055
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,65536,16384,0.3358160124884711
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,3,32,3584,0.01292622254954444
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,65536,51200,0.5209671126471626
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,65536,12288,0.2569199932946099
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,65536,10240,0.21430133448706734
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,65536,12288,0.16104266378614637
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,65536,10240,0.13457511530982122
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,65536,8192,0.1763786607318454
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,65536,7168,0.14614578088124594
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,65536,8192,0.12183022499084473
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,65536,6144,0.12671377923753527
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,65536,5120,0.10764266384972467
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,65536,6144,0.10538488626480103
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,65536,7168,0.10712977912690903
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,65536,5120,0.08096710840861003
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,65536,3584,0.07139999998940362
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,65536,4096,0.07011466556125216
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,65536,3072,0.061837335427602134
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,65536,3584,0.06698311037487455
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,65536,2560,0.053351110882229276
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,65536,3072,0.05490488807360331
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,65536,2560,0.04997600118319193
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,65536,2048,0.039665778477986656
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,65536,1024,0.024005333582560223
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,65536,51200,1.0154444376627605
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,65536,1536,0.035360889302359685
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,65536,768,0.018617777360810172
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,65536,512,0.013693333499961428
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,65536,1024,0.027143999934196472
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,65536,256,0.008742222355471717
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,65536,768,0.02299733294381036
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,65536,256,0.016706667012638517
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,65536,128,0.006215999937719769
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,65536,4096,0.09079200029373169
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,65536,128,0.013787555197874704
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,65536,512,0.018831999765502084
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,65536,32,0.0059075554211934405
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,65536,64,0.012695111334323883
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,65536,32,0.012789333032237159
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,65536,2048,0.04347733325428433
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,65536,1536,0.03342133429315355
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,51200,16384,0.24896444214714897
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,51200,65536,0.5198915799458822
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,51200,51200,0.41695555051167804
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,51200,12288,0.19019733534918892
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,51200,51200,0.7522266705830892
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,51200,65536,0.9673208660549588
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,65536,64,0.005600000007285013
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,51200,16384,0.19220356146494547
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,51200,12288,0.12764622105492487
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,51200,10240,0.15881510575612387
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,51200,8192,0.13097333908081055
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,51200,10240,0.11500977145300971
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,51200,6144,0.0998693307240804
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,51200,8192,0.1016426682472229
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,51200,5120,0.08832889133029515
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,51200,7168,0.0872960024409824
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,51200,4096,0.07041688760121663
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,51200,3584,0.06273511383268568
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,51200,4096,0.06050044298171997
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,51200,3072,0.05452177921930949
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,51200,3584,0.05647022194332547
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,51200,6144,0.07957422071033053
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,51200,2048,0.037245333194732666
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,51200,3072,0.053808887799580894
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,51200,1536,0.029493331909179688
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,51200,2560,0.04199999901983473
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,51200,2048,0.03408266769515143
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,51200,1024,0.02088177700837453
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,51200,768,0.01571111049917009
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,51200,1024,0.023670223024156358
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,51200,512,0.011429333024554782
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,51200,7168,0.1146355602476332
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,51200,1536,0.02999733222855462
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,51200,768,0.02104088829623328
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,51200,512,0.01789066692193349
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,51200,256,0.007600888609886169
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,51200,128,0.003906666818592283
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,51200,64,0.0033075554917256036
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,51200,256,0.014326221413082547
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,51200,128,0.01309866706530253
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,51200,64,0.01237777786122428
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,51200,32,0.0033928888539473214
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,51200,32,0.011986666255527072
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,51200,5120,0.06760088602701823
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,16384,65536,0.3218017684088813
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,16384,65536,0.17854755454593232
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,51200,2560,0.0453342232439253
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,16384,51200,0.24654134114583334
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,16384,12288,0.06490933232837252
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,16384,16384,0.08570755852593316
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,16384,10240,0.056442664729224316
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,16384,16384,0.07166666454739042
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,16384,12288,0.05819466378953722
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,16384,51200,0.1766035556793213
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,16384,6144,0.032229334115982056
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,16384,7168,0.03929600119590759
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,16384,5120,0.02913155489497715
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,16384,7168,0.03860355416933695
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,16384,4096,0.023997333314683702
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,16384,6144,0.037422223223580256
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,16384,10240,0.051177776522106595
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,16384,5120,0.03018666638268365
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,16384,4096,0.02730133301681942
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,16384,3584,0.026740445031060114
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,16384,2560,0.016162667009565566
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,16384,3072,0.024841777152485315
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,16384,3072,0.018904000520706177
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,16384,2048,0.014089778065681458
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,16384,1536,0.01108266661564509
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,16384,2560,0.021756443712446425
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,16384,2048,0.01862044466866387
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,16384,1024,0.008714666797055138
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,16384,768,0.006903111106819577
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,16384,1536,0.0177839994430542
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,16384,512,0.00489777781897121
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,16384,1024,0.01533600025706821
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,16384,768,0.014484445254007975
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,16384,512,0.011778666741318174
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,16384,8192,0.04414755437109205
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,16384,128,0.0031537777847713898
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,16384,64,0.0028088889602157804
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,16384,128,0.011042666931947073
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,16384,8192,0.04470400015513102
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,16384,64,0.010070222119490305
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,16384,32,0.002834666727317704
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,16384,3584,0.021551999780866835
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,16384,32,0.010355555348926121
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,12288,65536,0.24135732650756836
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,12288,65536,0.1556062168545193
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,12288,16384,0.06640266709857516
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,12288,51200,0.18830577532450357
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,12288,51200,0.16057777404785156
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,12288,12288,0.05166755451096428
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,12288,16384,0.07310222254859076
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,12288,10240,0.04380977816051907
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,12288,8192,0.03849244448873732
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,12288,12288,0.049490667051739164
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,12288,10240,0.044884443283081055
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,12288,7168,0.034330666065216064
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,12288,8192,0.039792001247406006
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,12288,6144,0.030238221089045208
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,12288,5120,0.026671111583709717
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,16384,256,0.0034764446318149567
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,12288,4096,0.022330666581789654
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,12288,6144,0.032749334971110024
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,12288,7168,0.0344782206747267
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,12288,3584,0.020234665936893888
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,16384,256,0.0123848890264829
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,12288,4096,0.025474665893448725
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,12288,3072,0.018195556269751657
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,12288,2560,0.015935111376974318
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,12288,2048,0.013507555756303998
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,12288,1536,0.008962666822804345
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,12288,3584,0.02481422159406874
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,12288,3072,0.02348800003528595
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,12288,2560,0.01976355579164293
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,12288,1024,0.007261333366235097
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,12288,2048,0.01829688913292355
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,12288,768,0.006171555568774541
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,12288,512,0.003863999827040566
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,12288,1536,0.01667022208372752
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,12288,256,0.003137777869900068
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,12288,1024,0.014039999908871122
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,12288,128,0.002871111035346985
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,12288,768,0.014466666513019137
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,12288,64,0.002854222224818336
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,12288,512,0.012729778057999082
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,12288,32,0.0028515555378463534
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,12288,256,0.011427555647161273
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,12288,64,0.010715555813577441
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,12288,128,0.01074488874938753
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,12288,32,0.01035199976629681
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,10240,65536,0.20285867320166695
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,10240,16384,0.05686399671766493
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,10240,51200,0.16033332877688938
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,10240,12288,0.044106665584776134
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,10240,51200,0.1373600032594469
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,10240,10240,0.03843199875619676
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,10240,16384,0.0539591113726298
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,10240,12288,0.04455822375085619
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,10240,8192,0.03223022156291538
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,10240,10240,0.0395706660217709
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,10240,7168,0.029414223300086126
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,10240,8192,0.033486220571729876
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,10240,6144,0.02571288910177019
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,10240,5120,0.02260444396071964
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,10240,7168,0.03021866745418972
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,10240,4096,0.019573332534896005
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,10240,6144,0.028953777419196233
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,10240,3584,0.017210667332013447
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,10240,5120,0.02481866710715824
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,10240,3072,0.015993777248594496
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,10240,4096,0.02247911029391819
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,10240,2560,0.014098667436175875
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,10240,3584,0.022637334134843614
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,10240,2048,0.010141332944234213
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,10240,3072,0.020124443703227572
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,10240,2560,0.01777777738041348
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,10240,2048,0.017639999588330586
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,10240,1024,0.006447111152940326
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,10240,768,0.004567111117972268
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,10240,1536,0.01585155559910668
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,10240,512,0.003590222034189436
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,10240,1024,0.013812444276279874
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,10240,256,0.003157333367400699
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,10240,768,0.01279022213485506
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,10240,65536,0.14629956086476645
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,10240,128,0.0028435554769304064
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,10240,64,0.0028088889602157804
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,10240,256,0.012048000262843238
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,10240,32,0.0028239999794297745
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,10240,128,0.010021333065297868
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,10240,64,0.009362666971153682
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,10240,32,0.009726222190592024
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,8192,65536,0.17127554946475557
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,12288,5120,0.027707555227809485
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,8192,65536,0.09850044382943048
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,8192,51200,0.12798666954040527
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,8192,16384,0.04668177829848396
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,8192,12288,0.03615999884075589
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,8192,10240,0.030243555704752605
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,8192,16384,0.04282666577233208
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,8192,51200,0.10098666614956325
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,8192,8192,0.023631999890009563
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,10240,1536,0.008519111408127679
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,8192,7168,0.020670221911536325
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,8192,10240,0.03219022353490194
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,8192,8192,0.026133333643277485
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,8192,6144,0.01851288808716668
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,8192,5120,0.01718755563100179
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,8192,7168,0.025418667329682246
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,8192,4096,0.014767110347747803
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,8192,3584,0.01295733369059033
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,8192,5120,0.020745777421527438
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,8192,4096,0.019588443968031142
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,10240,512,0.012755555411179861
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,8192,3072,0.010999999940395355
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,8192,3584,0.018590221802393597
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,8192,2560,0.010026666853162978
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,8192,2048,0.008867555194430882
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,8192,1536,0.007231111327807109
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,8192,3072,0.017826666434605915
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,8192,2560,0.01629333363638984
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,8192,1024,0.0058266665372583605
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,8192,2048,0.015549333559142219
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,8192,768,0.004206222378545337
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,8192,512,0.0035137778355015647
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,8192,1536,0.013981334037250943
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,8192,256,0.0031591111587153543
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,8192,768,0.01311555587583118
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,8192,128,0.0028195555011431375
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,8192,512,0.011390222443474663
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,8192,64,0.002493333278430833
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,8192,256,0.011353777514563667
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,8192,32,0.00282222218811512
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,8192,128,0.010412444670995077
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,8192,64,0.01000711073478063
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,8192,12288,0.035599999957614474
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,8192,32,0.009038222332795462
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,7168,65536,0.1467911137474908
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,7168,51200,0.11501510938008626
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,7168,16384,0.04204622242185804
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,7168,65536,0.09116977453231812
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,7168,12288,0.03336355421278212
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,7168,51200,0.09045600228839451
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,8192,6144,0.02473955518669552
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,7168,10240,0.028775999943415325
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,7168,16384,0.04025600022739834
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,7168,8192,0.02516888909869724
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,7168,7168,0.019720888800091214
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,7168,10240,0.0299217767185635
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,7168,6144,0.01753777762254079
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,7168,8192,0.026912000444200303
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,7168,7168,0.025040000677108765
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,7168,4096,0.013470222552617392
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,7168,6144,0.02255288925435808
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,7168,3584,0.011529777612951068
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,7168,5120,0.021067554752031963
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,7168,3072,0.0103511114915212
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,8192,1024,0.01236977759334776
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,7168,4096,0.019152000546455383
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,7168,2560,0.009302222066455418
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,7168,3584,0.018225777480337355
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,7168,3072,0.017846221725145977
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,7168,2048,0.007968000239796108
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,7168,2560,0.016107555892732408
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,7168,2048,0.014621333943472968
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,7168,1024,0.00488711107108328
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,7168,1536,0.01329422245422999
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,7168,768,0.0038417776425679526
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,7168,1024,0.01311466677321328
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,7168,512,0.003719999972316954
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,7168,768,0.012423999607563019
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,7168,256,0.0031662223239739737
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,7168,12288,0.03616088959905837
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,7168,512,0.012164444559150271
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,7168,128,0.0028195555011431375
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,7168,256,0.011060444845093621
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,7168,64,0.00281866660548581
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,7168,32,0.0029760001020299066
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,7168,5120,0.015111999379263984
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,7168,64,0.009344889058007134
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,7168,32,0.009661333428488838
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,6144,65536,0.12357866764068604
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,6144,51200,0.10011644495858087
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,6144,65536,0.08194755845599704
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,6144,16384,0.03750844465361701
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,6144,12288,0.029772443903817072
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,7168,1536,0.0069022224181228215
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,6144,51200,0.08667555782530044
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,6144,16384,0.03864444295565287
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,6144,10240,0.025584888127115037
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,6144,8192,0.022288888692855835
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,6144,7168,0.019896000623703003
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,6144,12288,0.03251288996802436
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,6144,6144,0.017501332693629794
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,6144,10240,0.027791112661361694
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,6144,5120,0.016014221641752455
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,6144,8192,0.024688889582951862
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,6144,4096,0.011735999749766456
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,6144,7168,0.02274399995803833
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,6144,3584,0.010313777459992303
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,6144,6144,0.021944888763957556
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,6144,3072,0.009375111096435124
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,6144,5120,0.019278221660190158
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,6144,2560,0.008512000242869059
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,6144,4096,0.018023111753993563
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,6144,2048,0.007251555720965068
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,6144,3584,0.01813155578242408
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,6144,1536,0.0064026667839950984
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,6144,1024,0.004293333325121137
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,6144,2560,0.01479022204875946
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,6144,2048,0.013424889081054263
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,6144,768,0.003866666720973121
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,6144,512,0.0031893334041039148
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,6144,1024,0.012051555845472546
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,6144,256,0.0032035555276605818
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,6144,768,0.012082666986518435
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,6144,128,0.0028604444944196274
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,6144,512,0.011038222246699862
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,6144,64,0.002532444480392668
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,6144,256,0.011076444553004371
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,6144,32,0.002826666666401757
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,6144,128,0.009658666948477427
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,6144,64,0.009161777794361115
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,6144,32,0.009351111120647853
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,5120,65536,0.1058880024486118
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,5120,51200,0.08530044555664062
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,5120,65536,0.0744675530327691
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,5120,16384,0.032115555471844144
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,5120,51200,0.08080622222688463
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,5120,12288,0.026661333110597398
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,5120,16384,0.03695733348528544
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,5120,10240,0.022950222094853718
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,5120,8192,0.01992266707950168
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,5120,12288,0.030461334519916113
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,5120,7168,0.01812533371978336
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,5120,10240,0.02776266634464264
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,5120,8192,0.02435644467671712
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,6144,3072,0.017157332764731515
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,5120,6144,0.016081778539551627
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,5120,5120,0.014088888963063559
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,5120,4096,0.010771555205186209
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,6144,1536,0.01312800000111262
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,5120,6144,0.020966221888860066
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,5120,3584,0.00962488849957784
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,5120,3072,0.008623999853928884
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,5120,5120,0.018971555762820773
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,7168,128,0.01039644413524204
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,5120,2560,0.007827555967701806
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,5120,4096,0.018199111024538677
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,5120,2048,0.006908444480763541
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,5120,3584,0.017512889371977914
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,5120,1536,0.005573333137565189
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,5120,3072,0.016504888733228047
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,5120,1024,0.004190222256713443
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,5120,2560,0.014190221826235453
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,5120,768,0.003522666792074839
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,5120,2048,0.013120888835854001
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,5120,512,0.003510222252872255
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,5120,1536,0.012778666284349231
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,5120,256,0.002883555574549569
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,5120,1024,0.011409777734014722
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,5120,768,0.012468444804350534
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,5120,128,0.002867555452717675
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,5120,512,0.011039999624093374
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,5120,64,0.0024986666523747975
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,5120,256,0.011081777513027191
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,5120,32,0.002492444382773505
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,5120,128,0.010372444159454769
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,5120,64,0.009709333380063375
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,4096,65536,0.08995288610458374
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,5120,32,0.00868000007337994
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,4096,51200,0.06871733400556776
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,4096,16384,0.027464000715149775
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,4096,65536,0.06912000311745538
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,4096,51200,0.07317688730027941
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,4096,16384,0.033378667301601835
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,4096,10240,0.018418666389253404
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,4096,8192,0.016335111525323655
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,4096,12288,0.02822222312291463
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,4096,7168,0.015171556009186639
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,4096,10240,0.026735110415352717
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,5120,7168,0.022924444741672937
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,4096,6144,0.013398222625255585
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,4096,8192,0.023390221926901076
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,4096,5120,0.01202133297920227
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,4096,4096,0.0107004443804423
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,4096,6144,0.020425778296258714
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,4096,5120,0.01872711049185859
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,4096,4096,0.017529777354664274
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,4096,3072,0.010317333042621613
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,4096,3584,0.016180444094869826
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,4096,2560,0.01033333357837465
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,4096,3072,0.015299555328157214
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,4096,2048,0.007832888927724626
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,4096,2560,0.013430222041077085
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,4096,1536,0.006239999913507038
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,4096,2048,0.013064000341627332
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,4096,1024,0.00589155571328269
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,4096,1536,0.01278133359220293
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,4096,12288,0.021962665849261816
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,4096,768,0.004883555488453971
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,4096,512,0.004197333421972063
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,4096,1024,0.011762667033407422
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,4096,256,0.003177777760558658
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,4096,768,0.01183199965291553
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,4096,512,0.010667555862002902
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,4096,128,0.002830222249031067
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,4096,64,0.0028204443968004654
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,4096,256,0.011352000137170156
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,4096,32,0.0028168888141711554
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,4096,128,0.010015111002657149
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,4096,7168,0.021976000732845728
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,4096,64,0.00903555585278405
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,3584,65536,0.07873333162731595
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,4096,32,0.009666666388511658
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,3584,51200,0.06348355611165364
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,3584,16384,0.025029333101378545
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,3584,65536,0.06575110885832045
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,3584,51200,0.06727821959389581
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,3584,10240,0.017156443662113614
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,3584,12288,0.027820444769329492
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,3584,8192,0.0151591118839052
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,3584,10240,0.024919999970330134
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,3584,7168,0.014072888427310519
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,3584,8192,0.022693332698610093
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,3584,6144,0.013381332986884646
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,3584,7168,0.020287111401557922
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,3584,5120,0.011647111011876
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,3584,6144,0.020063999626371596
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,3584,4096,0.010867555936177572
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,3584,5120,0.017864000466134813
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,3584,3584,0.010323555933104621
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,3584,4096,0.016513778103722464
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,3584,3072,0.010973333484596677
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,3584,3584,0.015262222952312894
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,4096,3584,0.01202755586968528
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,3584,2560,0.008285333712895712
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,3584,3072,0.014932443698247274
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,3584,2048,0.006923555499977536
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,3584,1536,0.005894222193294101
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,3584,12288,0.020201777418454487
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,3584,1024,0.00453955555955569
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,3584,2560,0.012788444757461548
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,3584,2048,0.01354311075475481
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,3584,16384,0.031203554736243352
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,3584,768,0.004564444637960858
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,3584,512,0.004041777716742622
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,3584,1536,0.012392000191741519
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,3584,256,0.003157333367400699
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,3584,128,0.0028168888141711554
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,3584,1024,0.011385777758227454
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,3584,64,0.00253866674999396
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,3584,32,0.0028391112056043413
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,3584,768,0.012091555529170565
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,3584,256,0.011727111207114326
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,3584,128,0.00964355551534229
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,3584,64,0.009671111073758867
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,3072,65536,0.06465599934260051
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,3072,51200,0.054640889167785645
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,3584,32,0.009319999979601966
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,3072,16384,0.02113866640461816
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,3072,12288,0.017433777451515198
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,3072,65536,0.06278844674428304
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,3072,10240,0.015867556134859722
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,3072,51200,0.06721066766315036
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,3072,16384,0.030328889687856037
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,3072,8192,0.013440888788965015
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,3072,7168,0.012813333008024426
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,3072,12288,0.02459999918937683
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,3072,10240,0.02310488952530755
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,3072,6144,0.011687999798191918
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,3072,5120,0.01039644413524204
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,3072,7168,0.019660444723235238
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,3072,4096,0.009664889011118147
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,3072,6144,0.018598222070270114
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,3072,5120,0.016516443755891588
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,3072,3584,0.008991999758614434
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,3072,3072,0.009327111144860586
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,3072,4096,0.01518311103185018
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,3072,2560,0.007648888561460707
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,3072,3584,0.014478221535682678
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,3072,3072,0.01405244403415256
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,3072,2048,0.006286222073766921
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,3072,1536,0.006028444402747684
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,3072,2560,0.013072888884279462
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,3072,1024,0.005886222339338726
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,3072,2048,0.01310488912794325
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,3072,1536,0.012727110750145383
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,3072,768,0.0041964443193541635
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,3584,512,0.01071911139620675
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,3072,512,0.0038693332009845306
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,3072,256,0.0035386664999855887
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,3072,1024,0.011371555427710215
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,3072,128,0.0032151111712058387
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,3072,768,0.011767999993430244
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,3072,512,0.010692444112565784
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,3072,64,0.0028657778683635923
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,3072,32,0.0028435554769304064
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,3072,128,0.01039644413524204
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,3072,64,0.008976889153321585
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,2560,65536,0.06029511160320706
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,3072,32,0.009873777627944946
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,2560,51200,0.04667466547754076
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,2560,16384,0.0196106665664249
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,2560,65536,0.06044266621271769
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,2560,12288,0.015815110670195687
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,2560,51200,0.05922933419545492
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,2560,10240,0.014426666829321118
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,2560,16384,0.029280887709723577
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,2560,8192,0.01255022237698237
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,2560,7168,0.011751111182901593
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,2560,12288,0.024328889118300542
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,2560,10240,0.022601778308550518
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,2560,6144,0.01070666644308302
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,2560,8192,0.020237333244747586
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,2560,5120,0.01000088867213991
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,2560,7168,0.0185208883550432
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,2560,4096,0.009165333376990424
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,2560,6144,0.017367111312018502
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,2560,3584,0.008330666356616551
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,2560,5120,0.015471110741297403
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,2560,3072,0.007941332956155142
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,2560,4096,0.014112000664075216
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,2560,2560,0.007078222102589077
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,2560,3584,0.014142221874660917
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,2560,1536,0.005886222339338726
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,2560,3072,0.013944000005722046
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,2560,1024,0.004551110996140374
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,2560,2560,0.012749333348539142
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,2560,2048,0.01240355521440506
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,2560,1536,0.01273333364062839
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,2560,512,0.003882666842805015
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,2560,1024,0.012048888537618848
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,2560,768,0.011408888631396823
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,2560,512,0.011063999599880643
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,2560,128,0.003162666741344664
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,2560,256,0.011033777561452655
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,2560,64,0.002489777695801523
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,3072,8192,0.02160088883505927
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,2560,32,0.0024871110088295406
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,2560,128,0.01074222226937612
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,2560,64,0.009400000174840292
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,2048,65536,0.05096266667048136
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,2560,32,0.009313777916961247
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,2048,51200,0.04073866539531284
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,2048,16384,0.01590222285853492
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,2048,65536,0.0589688883887397
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,2048,51200,0.05862577756245931
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,2048,16384,0.024823110964563157
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,2048,10240,0.01204622205760744
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,2048,12288,0.023544000254737005
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,2560,2048,0.005892444401979446
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,2048,8192,0.011124444504578909
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,2048,7168,0.010391111175219217
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,2048,10240,0.020236444142129686
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,2560,768,0.004201777693298128
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,2048,6144,0.009474666582213508
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,2048,8192,0.019160888261265226
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,2048,5120,0.008965333302815756
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,2048,7168,0.016918222109476726
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,3072,256,0.011662222445011139
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,2048,4096,0.010204444328943888
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,2560,256,0.00332622230052948
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,2048,6144,0.015445333388116626
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,2048,3584,0.009344889058007134
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,2048,5120,0.014442667365074158
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,2048,3072,0.00655644428398874
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,2048,2560,0.005949333310127258
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,2048,4096,0.014353776971499125
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,2048,2048,0.0069217777086628815
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,2048,1536,0.005724444571468566
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,2048,3584,0.013815999858909182
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,2048,3072,0.013070222404268054
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,2048,1024,0.005215999980767568
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,2048,2560,0.012459555433856117
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,2048,768,0.004578666554556953
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,2048,2048,0.012801777985360889
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,2048,512,0.0038568890757030914
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,2048,1536,0.011711111499203576
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,2048,256,0.0032355555643637977
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,2048,128,0.0031600000543726813
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,2048,1024,0.010871999793582492
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,2048,768,0.011426666544543372
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,2048,64,0.0028293333533737394
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,2048,32,0.0028888889484935333
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,2048,256,0.011045333411958484
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,2048,128,0.01000533335738712
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,2048,64,0.008826666408114964
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,1536,65536,0.037581334511439
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,2048,32,0.009299555586444007
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,1536,51200,0.03070311082734002
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,2048,12288,0.013174222575293647
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,1536,16384,0.013864888913101621
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,1536,12288,0.011356444822417365
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,1536,65536,0.056571556462181934
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,1536,10240,0.010624888870451184
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,1536,51200,0.05104710989528232
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,1536,8192,0.010332444475756751
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,1536,16384,0.024357333779335022
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,1536,12288,0.02087822225358751
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,1536,6144,0.009025777379671732
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,1536,10240,0.019911999503771465
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,1536,8192,0.016214221715927124
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,1536,5120,0.0076044441925154785
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,1536,7168,0.015814221567577787
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,1536,6144,0.01478844384352366
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,1536,5120,0.014137778017255994
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,1536,3584,0.0069448889957533936
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,1536,3072,0.006272000157170826
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,1536,4096,0.013457777599493662
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,1536,2560,0.005611555443869696
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,1536,3584,0.013125333521101209
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,1536,2048,0.005879999862776862
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,1536,3072,0.013086222112178802
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,1536,1536,0.00556355549229516
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,1536,2560,0.012409778104888068
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,1536,1024,0.004545777622196409
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,1536,2048,0.012059555285506778
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,1536,768,0.003915555361244413
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,1536,1536,0.011705777711338468
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,1536,512,0.003552888830502828
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,1536,1024,0.011085333095656501
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,2048,512,0.011726222104496427
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,1536,256,0.0028826666788922418
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,1536,768,0.011242667006121742
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,1536,512,0.01033688916100396
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,1536,256,0.011397333608733283
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,1536,64,0.002830222249031067
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,1536,32,0.002817777709828483
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,1536,128,0.01035288886891471
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,1024,65536,0.026875555515289307
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,1536,64,0.009696889254781935
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,1536,7168,0.009360888765917884
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,1536,32,0.009321778184837764
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,1024,51200,0.022248889009157818
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,1024,16384,0.01516888870133294
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,1024,12288,0.012724444270133972
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,1024,65536,0.05404177639219496
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,1536,4096,0.008010666403505538
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,1024,51200,0.046182221836513944
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,1024,10240,0.011716444459226398
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,1024,16384,0.022368000613318548
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,1024,8192,0.010178666975763109
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,1024,7168,0.009687999884287516
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,1024,12288,0.018931556079122756
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,1024,6144,0.008314666648705801
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,1024,10240,0.01813066667980618
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,1024,5120,0.00798044436507755
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,1024,8192,0.01590488851070404
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,1024,4096,0.007560888926188151
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,1024,7168,0.015456888410780164
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,1024,3584,0.006628444625271692
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,1024,6144,0.01519377695189582
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,1024,3072,0.0062977779242727495
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,1024,5120,0.01387466655837165
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,1024,4096,0.013748444616794586
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,1024,3584,0.013085333009560903
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,1024,3072,0.013581333061059317
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,1024,2560,0.012411555482281579
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,1024,2048,0.012127999630239276
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,1536,128,0.0028764444092909494
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,1024,1024,0.0052586665583981415
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,1024,1536,0.01148799972401725
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,1024,768,0.003903111235962974
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,1024,1024,0.011020444333553314
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,1024,512,0.003531555748648114
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,1024,768,0.011071110765139261
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,1024,256,0.0031804444475306403
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,1024,512,0.01068800025516086
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,1024,128,0.002834666727317704
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,1024,256,0.011039111349317761
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,1024,64,0.0028044444819291434
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,1024,128,0.009668444593747457
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,1024,32,0.0028479999552170434
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,1024,64,0.009330666727489894
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,768,65536,0.021900445222854614
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,1024,2560,0.005570666657553778
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,1024,2048,0.006578666468461354
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,1024,1536,0.0055440002017551
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,768,16384,0.010605333579911126
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,768,51200,0.046013332075542875
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,768,12288,0.0107004443804423
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,768,16384,0.021338666478792827
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,768,10240,0.009701333112186855
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,768,12288,0.018734221657117207
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,768,8192,0.009319110876984065
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,768,10240,0.017698667115635343
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,768,7168,0.008718222379684448
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,768,8192,0.01585244470172458
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,768,6144,0.007958222594526079
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,768,7168,0.016154666741689045
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,768,5120,0.006931555353932911
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,768,6144,0.014426666829321118
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,768,4096,0.007321777443091075
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,768,5120,0.014674666855070325
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,768,3584,0.006974221931563483
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,768,4096,0.013208889298968844
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,768,3072,0.006582222051090664
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,768,51200,0.018219555417696636
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,768,2560,0.006610666712125142
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,768,65536,0.05232000019815233
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,768,3072,0.01274400038851632
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,768,2048,0.005207111024194294
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,768,1536,0.004998222407367495
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,768,2560,0.013129777378506131
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,768,1024,0.004209777961174647
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,768,2048,0.011711999773979187
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,768,768,0.0038684445122877755
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,768,1536,0.011716444459226398
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,768,512,0.003559999995761447
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,768,1024,0.011749332977665795
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,768,256,0.0029057777590221832
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,768,768,0.011008000208271874
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,768,128,0.002867555452717675
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,768,512,0.010418666733635796
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,768,256,0.011734222372372946
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,768,128,0.009927999642160203
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,768,32,0.0028311111446883944
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,768,64,0.009305777649084726
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,512,65536,0.016851555969980028
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,512,51200,0.014832889040311178
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,768,32,0.008788444101810455
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,512,16384,0.01070755554570092
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,512,65536,0.052017778158187866
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,512,51200,0.043813334570990674
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,512,12288,0.008676444490750631
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,512,10240,0.007611555357774098
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,512,16384,0.020624000165197585
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,512,8192,0.008005333443482717
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,1024,32,0.008639111287064022
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,512,12288,0.01887022289964888
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,768,3584,0.013788444300492605
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,512,7168,0.007611555357774098
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,512,10240,0.01717066599263085
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,512,6144,0.007257777783605788
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,512,5120,0.0069102222720781965
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,512,8192,0.015799999237060547
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,512,4096,0.007277333074145847
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,512,3584,0.006918222126033571
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,512,7168,0.016207110550668504
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,512,6144,0.01444355481200748
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,512,3072,0.00673333348499404
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,512,5120,0.014492443866199918
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,512,2560,0.006266666783226862
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,512,4096,0.013111111190583972
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,512,2048,0.005919999960396025
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,512,3584,0.013074666261672974
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,512,1536,0.0043333334227403
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,512,3072,0.01274311128589842
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,512,1024,0.0038942222793896994
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,512,2560,0.013032889200581444
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,512,768,0.003571555432346132
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,512,2048,0.011735111474990845
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,512,1536,0.011417778001891242
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,512,1024,0.011144888897736868
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,512,256,0.0028195555011431375
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,512,768,0.012069332930776807
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,512,128,0.002826666666401757
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,512,64,0.0028124445428450904
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,512,512,0.010724444356229572
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,512,256,0.010672888822025724
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,512,128,0.010056888891590966
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,512,32,0.002540444541308615
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,512,64,0.008664888640244802
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,512,32,0.009321778184837764
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,256,51200,0.013316444224781461
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,256,65536,0.04859111044141981
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,256,16384,0.00867022242810991
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,256,51200,0.04110844598876105
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,256,12288,0.008292444050312042
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,256,16384,0.020568889048364427
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,256,10240,0.007640000018808577
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,256,12288,0.01889333294497596
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,256,8192,0.007277333074145847
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,256,10240,0.016978666186332703
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,256,7168,0.006623999940024481
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,256,8192,0.016381333271662395
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,512,512,0.0031795555518733132
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,256,6144,0.006301333506902059
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,256,7168,0.015189333094490899
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,256,5120,0.006237333433495627
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,768,64,0.0028044444819291434
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,256,4096,0.005613333235184352
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,256,3584,0.006296000132958095
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,256,6144,0.015074667003419666
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,256,5120,0.013409777647919126
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,256,3072,0.005932444499598608
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,256,2560,0.006020444548792309
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,256,4096,0.013062222136391534
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,256,3584,0.013416888813177744
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,256,2048,0.005919999960396025
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,256,65536,0.014648000399271647
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,256,1536,0.004315555509593752
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,256,3072,0.012423111332787408
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,256,1024,0.00388711111413108
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,256,2560,0.01312444441848331
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,256,768,0.0035146665241983202
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,256,2048,0.012456888953844706
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,256,512,0.0032133333798911837
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,256,1536,0.011381333072980246
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,256,256,0.0031724443866146933
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,256,1024,0.011023110813564725
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,256,128,0.0028168888141711554
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,256,64,0.002487999904486868
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,256,768,0.012074666718641916
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,256,512,0.01109955542617374
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,256,256,0.01073155552148819
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,256,128,0.009345778160625035
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,128,65536,0.014137778017255994
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,256,64,0.009657777845859528
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,128,51200,0.012744888663291931
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,256,32,0.008975110948085785
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,128,16384,0.007621333003044128
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,128,12288,0.007263110743628607
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,128,65536,0.047889779011408486
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,128,10240,0.0069546666410234236
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,128,51200,0.039713776773876615
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,128,16384,0.020917332834667627
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,128,8192,0.006646222124497096
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,128,12288,0.018198221921920776
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,128,7168,0.006567111031876669
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,128,6144,0.006256888724035687
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,128,10240,0.016960889101028442
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,128,5120,0.005888888819350137
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,128,8192,0.016191111670600045
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,128,4096,0.00553955551650789
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,128,7168,0.01514311134815216
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,128,6144,0.0141004439857271
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,128,3584,0.005606222069925732
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,128,3072,0.005566222386227713
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,128,5120,0.013461333182122974
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,128,2560,0.005589333259397083
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,128,4096,0.013752889302041797
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,128,3584,0.01277511070171992
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,128,2048,0.005568888866239124
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,128,3072,0.012425777812798819
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,128,1536,0.004543111142185
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,128,2560,0.011749332977665795
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,128,1024,0.003863999827040566
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,128,2048,0.011710222396585675
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,128,768,0.0035235554807715942
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,128,1536,0.011376889215575324
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,128,512,0.0032017777363459268
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,128,256,0.0028444443725877335
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,256,32,0.002536000063021978
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,128,1024,0.01073333372672399
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,128,128,0.0028640000770489373
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,128,64,0.002493333278430833
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,128,512,0.010739555789364709
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,128,32,0.002846222163902389
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,128,256,0.011056889262464313
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,64,65536,0.010764444039927589
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,64,51200,0.009753777749008602
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,128,64,0.010010666317409938
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,128,32,0.008634666601816813
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,64,65536,0.04825333423084683
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,64,12288,0.006242666807439592
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,64,51200,0.04061511158943176
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,64,16384,0.020241777102152508
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,64,10240,0.005952888892756567
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,64,12288,0.018575999471876357
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,64,8192,0.005946666830115848
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,64,10240,0.016887111796273124
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,64,7168,0.005695111221737332
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,64,8192,0.016150222884284127
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,64,6144,0.005599110904667113
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,64,7168,0.01514400045077006
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,64,5120,0.0052720002002186244
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,64,6144,0.014789332946141561
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,64,4096,0.005564444594913059
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,64,5120,0.013400889105266996
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,64,3584,0.005560889012283749
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,128,768,0.011090666883521609
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,64,4096,0.013471999930010902
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,64,3072,0.005615111026499007
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,64,2560,0.005903999838564131
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,64,3584,0.012805333567990197
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,128,128,0.009287111461162567
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,64,2048,0.005292444593376583
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,64,3072,0.013087111214796701
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,64,1536,0.00424888895617591
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,64,16384,0.00720888872941335
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,64,1024,0.003863111138343811
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,64,2560,0.0124177775449223
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,64,768,0.003495111233658261
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,64,2048,0.011728000309732227
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,64,512,0.0031555555760860443
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,64,1536,0.011728888584507836
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,64,256,0.0025253333151340485
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,64,128,0.002532444480392668
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,64,768,0.011071999867757162
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,64,512,0.010662222074137794
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,64,64,0.0025253333151340485
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,64,32,0.002529777793420686
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,64,256,0.011017777853541903
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,64,128,0.009318222602208456
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,32,65536,0.009476444787449306
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,32,51200,0.008290666672918532
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,64,64,0.00847111145655314
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,64,32,0.009360888765917884
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,32,16384,0.006258666515350342
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,32,12288,0.006346666564544042
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,32,65536,0.04789066645834181
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,32,51200,0.04039555456903245
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,32,16384,0.020291555258962844
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,32,8192,0.005575110928879843
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,32,10240,0.017232000827789307
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,32,7168,0.005631111148330901
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,32,8192,0.015576000014940897
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,32,6144,0.005608888963858287
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,32,7168,0.015480000111791821
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,32,5120,0.0052764444715446895
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,32,6144,0.014111111561457316
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,32,4096,0.0052266667286554975
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,32,5120,0.014119999276267158
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,32,3584,0.00573600000805325
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,32,4096,0.01311288856797748
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,32,3072,0.005389333185222413
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,64,1024,0.011705777711338468
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,32,2560,0.005950222412745158
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,32,3584,0.013152889079517789
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,32,2048,0.005586666779385672
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,32,3072,0.012500444220172035
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,32,1536,0.004171555654870139
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,32,2560,0.012778666284349231
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,32,1024,0.0035573335157500375
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,32,2048,0.012402666939629449
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,32,768,0.003549333247873518
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,32,1536,0.011366222467687396
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,32,512,0.00286311118139161
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,32,1024,0.011396444506115384
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,32,256,0.0028151110228565005
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,32,128,0.0028151110228565005
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,32,768,0.011727111207114326
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,32,12288,0.01798577772246467
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,32,64,0.0025946667624844448
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,32,512,0.010040000081062317
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,32,256,0.011371555427710215
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,32,128,0.010344888601038191
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,32,64,0.008328888979223039
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,2,32,32,0.008967111508051554
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,65536,16384,0.3333955605824788
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,65536,16384,0.2348239951663547
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,65536,51200,0.5365795559353298
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,65536,12288,0.2538355456458198
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,65536,12288,0.19725688298543295
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,65536,10240,0.21374932924906412
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,65536,51200,1.0049013561672635
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,65536,10240,0.13266044192843968
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,32,32,0.002495999965402815
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,65536,8192,0.12438489331139459
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,65536,7168,0.1438657840092977
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,65536,6144,0.12598844369252524
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,65536,7168,0.10964533355500962
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,65536,5120,0.1071573363410102
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,65536,6144,0.11467199855380589
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,65536,4096,0.08938488695356582
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,65536,3584,0.0732497771581014
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,65536,3072,0.0636026660601298
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,65536,3584,0.06548977560467191
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,65536,4096,0.06944088803397284
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,65536,3072,0.057137780719333224
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,65536,2560,0.05234311024347941
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,2,32,10240,0.005576888720194499
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,65536,2048,0.042897777424918286
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,65536,8192,0.17390044530232748
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,65536,2560,0.04992444316546122
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,65536,1536,0.033131556378470525
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,65536,1024,0.023688889212078516
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,65536,768,0.018556444181336295
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,65536,2048,0.04236533244450887
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,65536,512,0.013733333183659447
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,65536,1536,0.03526488939921061
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,65536,256,0.008849778109126622
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,65536,768,0.02234399980968899
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,65536,512,0.018600889378123812
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,65536,128,0.006239999913507038
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,65536,64,0.005551110953092575
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,65536,5120,0.08302666743596394
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,65536,32,0.005611555443869696
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,65536,256,0.015411555767059326
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,65536,128,0.011712888876597086
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,65536,64,0.012450666891203986
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,65536,32,0.012431110772821637
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,51200,16384,0.24863465627034506
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,51200,51200,0.4563928710089789
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,51200,65536,0.5563413302103678
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,51200,51200,0.7491022215949165
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,51200,16384,0.15121244059668645
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,51200,12288,0.18944177362653944
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,65536,1024,0.02625422179698944
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,51200,12288,0.15654844707912868
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,51200,65536,0.9717111587524414
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,51200,10240,0.15864533848232693
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,51200,8192,0.1297724379433526
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,51200,7168,0.11367289225260417
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,51200,8192,0.09797600242826675
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,51200,6144,0.09894577662150066
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,51200,5120,0.09038844373491074
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,51200,7168,0.0878560013241238
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,51200,6144,0.07949511210123698
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,51200,5120,0.06782311201095581
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,51200,3584,0.06346933046976726
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,51200,3072,0.05383022295104133
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,51200,4096,0.07362044519848294
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,51200,2560,0.04568799999025133
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,51200,3584,0.05778400103251139
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,51200,3072,0.04931555522812737
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,51200,2048,0.03669155637423197
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,51200,1536,0.029285334878497656
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,51200,1024,0.02123822271823883
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,51200,1536,0.029669334491093952
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,51200,768,0.015509333875444202
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,51200,1024,0.02291822267903222
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,51200,2048,0.03895555602179633
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,51200,512,0.011333333121405708
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,51200,256,0.007263110743628607
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,51200,10240,0.10946400298012628
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,51200,768,0.021016889148288306
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,51200,128,0.0038613333470291565
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,51200,64,0.0032311110860771606
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,51200,256,0.013779555757840475
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,51200,128,0.012072000238630505
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,51200,32,0.0035235554807715942
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,51200,64,0.011735999749766456
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,51200,32,0.012085333466529846
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,16384,65536,0.31940089331732857
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,16384,65536,0.21859199470943877
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,16384,51200,0.24664976861741808
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,16384,16384,0.08482222424613105
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,51200,2560,0.042881776889165245
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,16384,12288,0.06520533561706543
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,16384,16384,0.07448622253206041
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,16384,10240,0.05617688761817085
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,16384,12288,0.060601777500576444
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,16384,8192,0.04386666748258802
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,16384,10240,0.05383111039797465
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,16384,7168,0.03853955533769395
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,16384,8192,0.0417795545525021
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,16384,6144,0.033562666840023465
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,51200,512,0.01762488815519545
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,16384,5120,0.029153777493370905
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,16384,7168,0.040814220905303955
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,16384,4096,0.024597333537207708
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,16384,6144,0.03369155526161194
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,16384,3584,0.021309332715140447
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,16384,5120,0.032307555278142296
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,16384,3072,0.01885333326127794
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,16384,2560,0.016514667206340365
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,16384,3584,0.02555466691652934
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,16384,3072,0.02462399999300639
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,16384,2560,0.022464889619085524
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,51200,4096,0.05818400118086073
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,16384,1536,0.01128355579243766
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,16384,1024,0.008838222258620793
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,16384,1024,0.015174221661355762
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,16384,768,0.006911110960774952
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,16384,1536,0.01768977774514092
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,16384,51200,0.16348532835642496
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,16384,512,0.00490488898422983
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,16384,768,0.014135999812020196
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,16384,256,0.0035093331502543557
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,16384,512,0.012748444245921241
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,16384,128,0.003168888803985384
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,16384,256,0.011040888726711273
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,16384,64,0.002826666666401757
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,16384,128,0.010008888940016428
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,16384,32,0.00282222218811512
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,16384,64,0.00999466660949919
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,16384,4096,0.027622222900390625
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,16384,32,0.010018666585286459
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,16384,2048,0.014277334014574686
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,12288,16384,0.06570400132073297
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,12288,65536,0.24113421969943574
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,12288,51200,0.18653599421183267
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,16384,2048,0.020455999506844413
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,12288,65536,0.18852710723876953
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,12288,12288,0.05168977710935804
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,12288,51200,0.1496142281426324
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,12288,10240,0.043381333351135254
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,12288,8192,0.03853244582811991
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,12288,16384,0.06286578045950995
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,12288,10240,0.04734666811095344
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,12288,6144,0.029834667841593426
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,12288,12288,0.05201155609554715
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,12288,8192,0.03896888759401109
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,12288,5120,0.026477333572175767
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,12288,4096,0.022633777724372015
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,12288,7168,0.03677689035733541
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,12288,3584,0.020428443948427837
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,12288,5120,0.02830222249031067
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,12288,3072,0.017860444055663217
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,12288,4096,0.02528800070285797
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,12288,2560,0.015447111593352424
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,12288,3584,0.025638222694396973
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,12288,3072,0.02306488818592495
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,12288,2048,0.01364177796575758
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,12288,1536,0.009012444151772393
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,12288,1024,0.007288888924651676
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,12288,2560,0.020231111182106864
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,12288,2048,0.01884888940387302
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,12288,768,0.0059262220230367445
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,12288,512,0.003801777958869934
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,12288,1024,0.014460444450378418
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,12288,256,0.0032053333189752367
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,12288,768,0.013103110922707452
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,12288,512,0.0125591109196345
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,12288,256,0.011531555818186866
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,12288,64,0.0028088889602157804
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,12288,128,0.00977244476477305
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,12288,32,0.0028213332924577924
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,12288,64,0.01038044442733129
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,12288,7168,0.03525244527392917
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,12288,32,0.00998488896422916
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,10240,65536,0.20311200618743896
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,12288,6144,0.032199111249711775
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,10240,51200,0.15924533208211264
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,10240,65536,0.1665173371632894
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,10240,16384,0.05695199966430664
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,10240,12288,0.04425155454211765
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,10240,10240,0.038189331690470375
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,10240,16384,0.05702933337953356
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,10240,51200,0.13535200224982366
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,10240,12288,0.04460710949367947
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,10240,8192,0.031553778383466936
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,10240,7168,0.02919911013709174
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,12288,1536,0.016608888904253643
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,10240,10240,0.040088001224729754
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,10240,6144,0.025791111919615004
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,10240,8192,0.03381866547796462
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,10240,5120,0.022615111536449854
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,10240,7168,0.03102488981352912
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,10240,4096,0.01921866668595208
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,12288,128,0.0028728888266616394
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,10240,3584,0.01854222185081906
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,10240,6144,0.02870044443342421
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,10240,3072,0.016864000095261466
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,10240,5120,0.025232000483406916
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,10240,4096,0.023014222582181294
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,10240,2560,0.014471999473041959
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,10240,3584,0.021984888447655573
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,10240,2048,0.010838222172525195
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,10240,1536,0.009138666921191746
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,10240,1024,0.006591111007663939
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,10240,3072,0.020012444920010038
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,10240,768,0.004914666629499859
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,10240,2560,0.01863822175396813
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,10240,512,0.0038844446341196695
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,10240,2048,0.01779911087618934
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,10240,256,0.0031831111345026228
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,10240,1536,0.015795555379655626
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,10240,128,0.0029013332807355454
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,10240,768,0.013191111385822296
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,10240,64,0.002862222285734283
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,10240,512,0.012083555261294046
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,10240,32,0.0028497777465316984
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,10240,256,0.010979555547237396
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,10240,128,0.01033866653839747
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,10240,64,0.009834667046864828
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,10240,32,0.009024889104896123
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,8192,65536,0.16993599467807344
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,8192,51200,0.12701155079735651
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,8192,65536,0.11567110485500759
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,8192,12288,0.034832000732421875
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,8192,51200,0.09529511133829753
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,8192,16384,0.04259377717971802
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,8192,12288,0.03790488839149475
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,8192,8192,0.024439111351966858
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,8192,10240,0.031531555785073176
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,8192,7168,0.02184533410602146
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,8192,8192,0.028763555818133887
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,8192,6144,0.019156444403860304
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,8192,7168,0.025032889511850145
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,8192,5120,0.016559999850061204
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,8192,6144,0.02502577834659153
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,8192,4096,0.014946666028764514
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,10240,1024,0.01257511145538754
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,8192,5120,0.021235555410385132
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,8192,3584,0.013152889079517789
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,8192,3072,0.011380444798204633
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,8192,2560,0.010194666683673859
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,8192,4096,0.019641778535313077
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,8192,3584,0.01886666648917728
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,8192,3072,0.017533333765135873
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,8192,1536,0.007601777712504069
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,8192,2560,0.017151110702090792
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,8192,16384,0.04657511247528923
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,8192,1024,0.005663110978073544
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,8192,2048,0.014489778214030795
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,8192,768,0.004222222086456087
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,8192,512,0.0035342222286595237
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,8192,1536,0.013751111096805997
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,8192,256,0.0032008888406885993
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,8192,10240,0.031142221556769475
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,8192,1024,0.013112000293201871
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,8192,768,0.012423111332787408
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,8192,128,0.002847111059559716
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,8192,512,0.012256888879670037
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,8192,32,0.002526222210791376
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,8192,256,0.01072622256146537
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,8192,128,0.009691555466916826
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,8192,64,0.009015111459626092
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,8192,32,0.01000088867213991
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,7168,65536,0.14567822880215114
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,7168,51200,0.11451200644175212
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,7168,16384,0.042169776227739125
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,7168,65536,0.11259644561343723
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,7168,12288,0.033195555210113525
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,7168,51200,0.0891617801454332
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,7168,10240,0.02838133441077338
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,7168,12288,0.034372445609834455
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,7168,8192,0.024812445044517517
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,7168,7168,0.01942311061753167
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,7168,8192,0.026515555050637987
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,7168,6144,0.01717066599263085
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,8192,2048,0.008544888761308458
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,7168,7168,0.02535466684235467
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,7168,5120,0.014375110467274984
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,7168,4096,0.012864888542228274
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,7168,6144,0.02311466634273529
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,7168,5120,0.020412445068359375
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,7168,3584,0.011370666325092316
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,7168,3072,0.01036444471942054
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,7168,4096,0.018927999668651156
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,7168,2560,0.009675555759006077
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,8192,64,0.002550222186578645
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,7168,3584,0.018545778261290658
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,7168,2048,0.008028444316652086
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,7168,3072,0.017310221989949543
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,7168,1536,0.0069102222720781965
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,7168,1024,0.004522666749027041
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,7168,2560,0.016978666186332703
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,7168,2048,0.014434667097197639
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,7168,768,0.004190222256713443
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,7168,512,0.0036675557494163513
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,7168,1536,0.014451555079884
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,7168,1024,0.011728888584507836
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,7168,768,0.012666666673289405
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,7168,512,0.011778666741318174
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,7168,256,0.01035822182893753
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,7168,64,0.00282222218811512
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,7168,128,0.009319110876984065
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,7168,32,0.0025475554996066624
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,7168,10240,0.02960977620548672
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,7168,64,0.009338666995366415
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,7168,32,0.009308444129096137
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,6144,65536,0.12632977962493896
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,6144,51200,0.09672888782289292
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,6144,65536,0.09919733471340603
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,6144,16384,0.03798222210672166
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,6144,51200,0.08273244566387601
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,6144,12288,0.02996088729964362
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,6144,16384,0.040927112102508545
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,6144,10240,0.02572800053490533
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,6144,12288,0.031346665488349065
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,6144,8192,0.0222080002228419
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,6144,7168,0.01977244516213735
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,6144,10240,0.027648889356189307
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,6144,8192,0.025058666865030926
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,6144,6144,0.01814311080508762
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,7168,256,0.0032035555276605818
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,6144,7168,0.02608266638384925
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,6144,5120,0.015817777978049386
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,7168,128,0.0028080000645584534
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,6144,4096,0.011963555382357704
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,6144,6144,0.022628444764349196
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,6144,3584,0.010683555569913654
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,6144,5120,0.019902222686343722
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,7168,16384,0.04279822111129761
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,6144,4096,0.017861333158281114
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,6144,3584,0.018505778577592637
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,6144,2560,0.008619555168681675
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,6144,2048,0.007284444239404466
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,6144,1536,0.006256000035338932
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,6144,2560,0.01550044450494978
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,6144,1024,0.004407111141416761
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,6144,2048,0.013741333451535968
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,6144,768,0.0038497779104444715
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,6144,1536,0.01418133411142561
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,6144,512,0.003359111025929451
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,6144,1024,0.011876444849703046
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,6144,256,0.0031591111587153543
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,6144,768,0.011731555892361535
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,6144,512,0.01219733307758967
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,6144,128,0.00286311118139161
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,6144,64,0.0028035555862718155
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,6144,256,0.010675555302037133
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,6144,32,0.00249422217408816
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,6144,128,0.009690666364298927
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,6144,64,0.008968888885445064
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,6144,32,0.009656888743241629
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,5120,65536,0.1075048910246955
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,5120,51200,0.08374577760696411
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,5120,65536,0.09514844417572021
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,5120,16384,0.03320622113015916
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,5120,51200,0.07220266924964057
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,5120,12288,0.02680355476008521
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,6144,3072,0.009600888523790572
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,5120,10240,0.023172444767422144
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,5120,16384,0.03906311260329352
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,5120,8192,0.020317332612143624
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,5120,12288,0.02913244565327962
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,5120,7168,0.017959111266665988
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,6144,3072,0.01720533271630605
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,5120,10240,0.02649066680007511
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,5120,6144,0.016498666670587327
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,5120,5120,0.014472888575659858
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,5120,8192,0.02432800001568264
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,5120,4096,0.010999999940395355
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,5120,6144,0.022755554980701868
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,5120,5120,0.018862222631772358
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,5120,3584,0.00959644466638565
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,5120,3072,0.00885511106914944
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,5120,4096,0.01754844519827101
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,5120,2560,0.007889777421951294
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,5120,3584,0.018216888109842937
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,5120,2048,0.006903111106819577
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,5120,3072,0.015792888071801927
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,5120,1536,0.005564444594913059
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,5120,1024,0.0038515557017591265
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,5120,2560,0.014633778068754407
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,5120,768,0.003560888684458203
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,5120,2048,0.014107555150985718
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,5120,1536,0.013088888592190213
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,5120,512,0.0035253332720862497
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,5120,256,0.0032088889016045462
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,5120,1024,0.011367110742463006
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,5120,768,0.011394666300879585
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,5120,512,0.011731555892361535
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,5120,64,0.0028373334142896864
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,5120,256,0.01034400032626258
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,5120,32,0.002806222273243798
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,5120,128,0.008665777742862701
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,5120,64,0.009676444033781687
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,4096,65536,0.0897795557975769
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,5120,32,0.009200000100665623
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,4096,51200,0.06927377647823758
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,4096,65536,0.0875964429643419
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,4096,51200,0.07833066913816664
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,4096,12288,0.021114667256673176
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,4096,16384,0.036304887798097395
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,4096,10240,0.018806222412321303
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,4096,8192,0.01648888819747501
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,4096,12288,0.02977422210905287
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,4096,10240,0.025607999828126695
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,4096,7168,0.015089778436554803
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,4096,6144,0.014071111877759298
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,4096,8192,0.024718221690919664
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,4096,5120,0.012324444121784635
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,4096,7168,0.024273778001467388
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,4096,4096,0.011355555719799466
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,4096,6144,0.019612444771660697
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,5120,128,0.0028195555011431375
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,4096,3584,0.014072888427310519
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,4096,5120,0.01886488828394148
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,4096,3072,0.011015999648306104
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,4096,2560,0.009633777870072259
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,4096,4096,0.01682844426896837
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,4096,2048,0.009138666921191746
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,4096,3072,0.015290665957662793
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,4096,3584,0.016843555702103507
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,4096,1536,0.007266666326257918
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,4096,2560,0.014087110757827759
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,4096,1024,0.005564444594913059
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,4096,2048,0.013807999591032663
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,4096,1536,0.012440889245933957
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,4096,1024,0.011709333293967776
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,4096,512,0.004176889028814104
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,4096,768,0.011707555916574268
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,4096,256,0.003060444361633725
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,5120,7168,0.022639999787012737
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,4096,128,0.002854222224818336
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,4096,512,0.011365333365069495
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,4096,64,0.002519999941190084
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,4096,256,0.010173333187898
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,4096,32,0.002817777709828483
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,4096,128,0.009677333136399588
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,4096,64,0.00868000007337994
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,3584,65536,0.07833955685297649
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,4096,32,0.009329777624871995
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,3584,51200,0.06252444452709623
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,3584,65536,0.08216800292332967
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,3584,16384,0.025331555141343012
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,3584,51200,0.06332444482379489
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,3584,12288,0.019948444432682462
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,3584,10240,0.017463111215167575
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,3584,16384,0.03239288926124573
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,3584,8192,0.014997333288192749
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,3584,12288,0.028022223048739966
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,3584,7168,0.013781333135233985
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,4096,768,0.0046533333758513136
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,3584,8192,0.021789333886570398
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,3584,6144,0.012609778179062737
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,4096,16384,0.027431999643643696
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,3584,7168,0.022052443689770166
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,3584,5120,0.011713777979214987
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,3584,4096,0.010506666368908353
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,3584,3584,0.011810666984981961
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,3584,6144,0.018858666221300762
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,3584,3072,0.011002666420406766
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,3584,2560,0.009690666364298927
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,3584,4096,0.01573955516020457
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,3584,5120,0.01681600014368693
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,3584,2048,0.007671111159854465
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,3584,3072,0.013810666898886362
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,3584,1536,0.006237333433495627
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,3584,2560,0.01484444406297472
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,3584,1024,0.004881777697139316
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,3584,768,0.004239999999602635
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,3584,2048,0.012706666356987424
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,3584,512,0.0038417776425679526
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,3584,1536,0.012392889294359418
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,3584,256,0.002977777686383989
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,3584,1024,0.012111110819710625
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,3584,128,0.0028560000161329904
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,3584,768,0.011720889144473605
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,3584,512,0.011126221881972419
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,3584,64,0.002532444480392668
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,3584,256,0.010010666317409938
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,3584,128,0.009343110852771336
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,3584,64,0.008979555633332994
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,3072,65536,0.06886044475767347
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,3584,32,0.008985777695973715
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,3072,51200,0.05518577827347649
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,3584,10240,0.024688889582951862
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,3072,16384,0.021703110800849065
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,3072,51200,0.06259910927878486
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,3072,12288,0.017567111386193168
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,3072,10240,0.015850666496488783
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,3072,16384,0.02911111050181919
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,3072,8192,0.013758222262064615
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,3072,12288,0.026968000663651362
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,3072,7168,0.01278133359220293
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,3072,10240,0.02234222160445319
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,3584,3584,0.01568800045384301
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,3072,6144,0.01203644441233741
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,3072,8192,0.020947555700937908
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,3072,5120,0.010666666759385003
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,3072,7168,0.019880000087949965
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,3072,4096,0.009768889182143742
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,3072,3584,0.009017777939637503
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,3072,6144,0.01870844430393643
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,3072,5120,0.01683644453684489
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,3072,3072,0.008972444468074376
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,3072,4096,0.01477688882086012
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,3072,2560,0.007999999655617608
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,3072,2048,0.006608888920810487
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,3072,3584,0.015249777171346875
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,3072,3072,0.013783999615245394
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,3072,1536,0.006617777877383762
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,3072,1024,0.0052560000783867305
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,3072,2560,0.013432888521088494
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,3072,2048,0.012533333566453723
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,3072,768,0.004868444469239977
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,3072,1536,0.012895999683274163
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,3072,1024,0.011785777906576792
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,3072,256,0.0035111109415690103
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,3072,768,0.011720889144473605
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,3072,128,0.0031759999692440033
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,3072,65536,0.07891555627187093
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,3072,256,0.010346666806273991
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,3072,64,0.0028604444944196274
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,3072,128,0.00869333330127928
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,3072,32,0.0028124445428450904
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,3072,64,0.009331555830107795
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,2560,65536,0.05868089199066162
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,3072,32,0.008643555144468943
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,2560,51200,0.04694044589996338
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,2560,65536,0.07097066773308648
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,2560,16384,0.01937333411640591
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,2560,51200,0.05847377909554375
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,2560,12288,0.015436444017622205
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,2560,16384,0.028043554888831243
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,3584,32,0.0028400001012616684
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,2560,10240,0.01426488823360867
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,3072,512,0.004193777839342753
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,2560,10240,0.021360889077186584
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,2560,7168,0.01146044416560067
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,3072,512,0.012028444144460889
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,2560,8192,0.019884443945354886
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,2560,6144,0.01074044406414032
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,2560,5120,0.009887999958462184
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,2560,7168,0.019919999771647982
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,2560,6144,0.016887111796273124
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,2560,4096,0.009311999711725447
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,2560,5120,0.01586933268441094
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,2560,4096,0.014275555809338888
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,2560,3072,0.008623999853928884
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,2560,3584,0.014469333820872836
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,2560,2560,0.00756444450881746
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,2560,3072,0.013117333253224691
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,2560,2048,0.006575999988449945
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,2560,2560,0.013797333670987023
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,2560,1536,0.006604444649484422
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,2560,2048,0.012164444559150271
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,2560,1024,0.004872888740566042
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,2560,1536,0.012852444416946836
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,2560,12288,0.024996444582939148
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,2560,768,0.00453333349691497
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,2560,8192,0.012450666891203986
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,2560,1024,0.011358222199810876
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,2560,256,0.003173333282272021
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,2560,768,0.01130222198035982
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,2560,128,0.0028488888508743713
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,2560,512,0.011711111499203576
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,2560,64,0.0025537777692079544
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,2560,256,0.009732444253232744
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,2560,32,0.0028284444577164124
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,2560,128,0.008970666262838576
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,2560,64,0.009392889009581672
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,2048,65536,0.05100533366203308
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,2560,3584,0.008757332960764566
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,2560,32,0.008655110994974772
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,2048,51200,0.04063644342952304
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,2048,16384,0.016866667403115165
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,2048,12288,0.013677332964208392
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,2048,65536,0.06395644611782499
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,2048,10240,0.012311110893885294
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,2048,16384,0.027855111493004694
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,2048,12288,0.024506666594081458
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,2048,8192,0.011015999648306104
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,2048,7168,0.010308444499969482
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,2048,10240,0.020264888803164165
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,2048,6144,0.009709333380063375
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,2048,8192,0.019056888090239633
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,2048,5120,0.008650666309727563
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,2048,6144,0.015808888607554965
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,2048,4096,0.010676444404655032
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,2560,512,0.0038737778862317405
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,2048,5120,0.014639111028777229
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,2048,3584,0.009739555418491364
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,2048,3072,0.006664888726340399
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,2048,4096,0.014146667387750415
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,2048,2560,0.006562666760550604
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,2048,3584,0.013644444445768992
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,2048,2048,0.008276444342401292
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,2048,2560,0.013423999978436364
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,2048,1536,0.006590222318967183
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,2048,1024,0.005191111316283544
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,2048,2048,0.01203555530971951
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,2048,768,0.004544888933499654
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,2048,1536,0.012118221984969245
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,2048,512,0.0038399998512532976
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,2048,1024,0.011692444483439127
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,2048,256,0.0032702222880389956
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,2048,768,0.011360888679822287
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,2048,51200,0.057688891887664795
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,2048,128,0.0028773333049482773
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,2048,512,0.011720889144473605
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,2048,64,0.0026604444202449587
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,2048,32,0.0028159999185138275
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,2048,128,0.008987555901209513
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,2048,64,0.009728888670603434
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,2048,7168,0.0173680004146364
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,2048,32,0.009328888522254096
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,1536,51200,0.03049955434269375
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,1536,16384,0.013440888788965015
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,1536,65536,0.059763557381100126
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,1536,12288,0.011687111523416309
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,1536,51200,0.04971999923388163
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,1536,16384,0.024704888463020325
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,1536,10240,0.010371555884679159
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,1536,12288,0.021500445074505273
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,2048,3072,0.013094222380055321
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,1536,7168,0.009617778162161509
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,1536,8192,0.016168889072206285
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,1536,6144,0.008976000050703684
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,1536,7168,0.015949333707491558
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,1536,5120,0.007735110819339752
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,1536,6144,0.01482222146458096
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,1536,4096,0.007278222176763747
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,1536,5120,0.014968888627158271
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,1536,3584,0.00720000018676122
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,2048,256,0.010036444498433007
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,1536,4096,0.013136000268989138
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,1536,3072,0.006590222318967183
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,1536,2560,0.005938666562239329
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,1536,65536,0.037640889485677086
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,1536,3584,0.014073777529928418
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,1536,2048,0.006599111275540457
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,1536,3072,0.012438221938080259
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,1536,1536,0.005609777652555042
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,1536,1024,0.004527111020353106
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,1536,2560,0.013396444420019785
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,1536,768,0.0038853333228164246
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,1536,1536,0.011714666253990598
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,1536,512,0.0035173334181308746
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,1536,768,0.011714666253990598
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,1536,256,0.0028728888266616394
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,1536,512,0.011374221907721626
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,1536,128,0.0028195555011431375
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,1536,10240,0.018799111247062683
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,1536,64,0.002532444480392668
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,1536,128,0.009662222531106737
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,1536,32,0.00249777775671747
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,1536,64,0.008749333520730337
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,1024,65536,0.026404443714353774
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,1536,32,0.009499555660618676
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,1024,51200,0.02163999941613939
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,1024,65536,0.05849866734610664
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,1024,51200,0.047487109899520874
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,1024,12288,0.012879999975363413
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,1024,16384,0.02331111166212294
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,1024,10240,0.011718221836619906
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,1536,2048,0.012484444512261285
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,1024,12288,0.018720888429217868
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,1024,8192,0.010969777901967367
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,1024,7168,0.009791110952695211
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,1536,1024,0.011027555498811932
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,1024,6144,0.00833333366447025
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,1024,8192,0.01579466627703773
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,1024,5120,0.008294222255547842
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,1024,7168,0.015844444433848064
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,1024,4096,0.007320889168315464
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,1536,8192,0.010116444693671333
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,1024,6144,0.014787554740905762
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,1536,256,0.010046222143703038
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,1024,5120,0.014085332552591959
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,1024,3072,0.006292444550328785
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,1024,2560,0.00554577757914861
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,1024,4096,0.013832888669437833
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,1024,3584,0.013018666870064206
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,1024,2048,0.007658667034573025
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,1024,3072,0.01239111108912362
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,1024,2560,0.013443555268976422
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,1024,1024,0.005220444252093633
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,1024,2048,0.011726222104496427
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,1024,768,0.004543111142185
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,1024,1536,0.011700444751315646
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,1024,512,0.003847111016511917
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,1024,16384,0.014771555860837301
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,1024,768,0.011061333119869232
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,1024,512,0.011378666592968835
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,1024,128,0.003012444410059187
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,1024,256,0.009656888743241629
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,1024,64,0.0028213332924577924
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,1024,128,0.009675555759006077
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,1024,32,0.0028115556471877625
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,1024,10240,0.016937777400016785
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,1024,64,0.008636444807052612
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,768,65536,0.022488888767030504
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,768,51200,0.017832888497246634
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,1024,32,0.009366222553782994
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,768,16384,0.010102222363154093
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,768,65536,0.053358223703172475
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,768,12288,0.010826666322019366
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,768,51200,0.044228444496790566
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,768,10240,0.009495110975371467
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,768,16384,0.021715554926130507
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,768,8192,0.008970666262838576
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,768,12288,0.018204443984561496
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,1024,1536,0.006606222026877933
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,768,7168,0.00830577810605367
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,768,10240,0.016751110553741455
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,768,6144,0.00794933322403166
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,768,8192,0.015691555208630033
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,768,5120,0.006575111299753189
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,768,4096,0.007317333585686154
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,768,7168,0.015847999188635085
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,768,6144,0.01477866702609592
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,768,3584,0.006948444578382704
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,768,5120,0.013863999810483722
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,1024,1024,0.011533333195580376
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,768,3072,0.006659555352396435
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,1024,256,0.003154666680428717
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,768,2560,0.006226666685607698
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,768,2048,0.005220444252093633
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,768,3584,0.0129439996348487
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,768,3072,0.01313866674900055
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,768,1536,0.005247999810510212
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,768,2560,0.01240533341964086
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,768,1024,0.004242666479614046
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,768,2048,0.0114720000161065
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,768,1536,0.01239111108912362
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,768,512,0.00351200004418691
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,768,1024,0.010738666686746808
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,768,768,0.011390222443474663
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,768,512,0.011256888508796692
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,768,128,0.002867555452717675
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,768,256,0.01036533299419615
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,768,64,0.0025600000388092464
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,1024,3584,0.006597333484225803
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,768,32,0.0025519999778932994
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,768,128,0.009337777892748514
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,512,65536,0.01737866633468204
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,768,64,0.009333333207501305
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,512,51200,0.014648000399271647
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,768,32,0.009328888522254096
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,512,16384,0.010672888822025724
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,512,65536,0.05227466755443149
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,512,12288,0.008736000292830998
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,512,51200,0.04298133320278592
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,512,10240,0.007663999994595845
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,512,16384,0.02032177812523312
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,512,8192,0.00794400026400884
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,512,12288,0.018590221802393597
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,512,7168,0.007605333295133378
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,512,10240,0.01682222220632765
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,512,6144,0.007255111303594377
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,512,8192,0.01551822159025404
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,512,5120,0.0069368887278768755
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,768,768,0.0039057777159743835
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,512,7168,0.015799999237060547
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,512,4096,0.006968888971540663
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,512,6144,0.014455111490355598
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,512,3584,0.0070675553547011475
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,512,3072,0.006631111105283101
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,512,5120,0.013761777844693927
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,768,256,0.0028888889484935333
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,512,2560,0.0063493334584765965
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,512,2048,0.006250666661394968
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,512,3584,0.013065777719020844
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,512,3072,0.012091555529170565
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,512,2560,0.012094222009181976
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,512,2048,0.011400889191362592
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,512,1536,0.011746666497654386
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,512,768,0.0034933334423436057
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,512,1024,0.010403555300500657
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,512,512,0.0031804444475306403
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,512,768,0.011056000159846412
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,512,256,0.0028640000770489373
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,512,512,0.01073688848151101
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,512,128,0.0026684444811609057
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,512,256,0.009506666825877296
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,768,4096,0.013092444174819522
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,512,64,0.002542222125662698
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,512,32,0.0024782222592168385
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,512,128,0.009130666653315226
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,256,65536,0.01443199978934394
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,512,64,0.00850577818022834
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,256,51200,0.01333866682317522
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,512,32,0.008615111311276754
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,256,16384,0.008598222500748104
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,256,65536,0.04863288998603821
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,256,12288,0.007997333175606197
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,256,51200,0.040431999497943454
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,512,4096,0.013826666606797112
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,256,16384,0.020234665936893888
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,256,10240,0.007263110743628607
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,256,8192,0.0069573331210348345
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,512,1536,0.004774222357405556
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,256,7168,0.006599111275540457
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,256,12288,0.017871111631393433
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,256,6144,0.006267555471923616
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,256,10240,0.01759822169939677
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,256,5120,0.005927111125654644
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,512,1024,0.0038480001191298165
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,256,4096,0.005945777727497949
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,256,7168,0.01479111115137736
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,256,3584,0.0059368887709246735
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,256,6144,0.014164444473054675
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,256,5120,0.014447111222479077
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,256,4096,0.012787555654843649
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,256,2560,0.005893333504597346
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,256,2048,0.00591822216908137
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,256,3584,0.013082666529549493
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,256,3072,0.01239111108912362
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,256,1536,0.004553777890072929
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,256,1024,0.0038568890757030914
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,256,2560,0.012119111087587146
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,256,2048,0.012387555506494312
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,256,768,0.0035173334181308746
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,256,1536,0.011536888778209686
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,256,512,0.0032275555034478507
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,256,1024,0.010694222317801582
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,256,256,0.0028204443968004654
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,256,768,0.011714666253990598
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,256,128,0.0028311111446883944
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,256,512,0.011403555671374003
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,256,64,0.002817777709828483
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,256,256,0.010108444425794814
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,256,32,0.002500444443689452
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,256,128,0.009330666727489894
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,128,65536,0.014102222190962898
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,256,32,0.009338666995366415
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,128,51200,0.012383999923865
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,128,65536,0.048251556025611035
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,128,16384,0.007271111011505127
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,256,8192,0.015649777319696214
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,128,12288,0.006928000185224745
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,128,51200,0.03999200132158067
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,128,10240,0.0069511110583941145
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,256,3072,0.005937777873542573
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,128,16384,0.020608888732062448
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,128,8192,0.006574222197135289
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,128,7168,0.006265777680608962
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,128,12288,0.017883555756674874
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,128,6144,0.005612444546487596
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,128,10240,0.01666755477587382
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,128,5120,0.005599110904667113
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,128,8192,0.01588000026014116
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,128,4096,0.005560889012283749
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,128,6144,0.014153778553009033
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,128,3584,0.00591555568906996
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,128,5120,0.013624000052611033
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,128,3072,0.005254222287072076
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,128,4096,0.01346933344999949
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,128,2560,0.005952000204059813
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,128,3584,0.012788444757461548
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,128,3072,0.012067555553383298
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,128,2560,0.013085333009560903
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,128,1536,0.00424799985355801
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,128,2048,0.011376000112957425
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,256,64,0.009363555245929295
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,128,1024,0.0038480001191298165
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,128,768,0.0034808889031410217
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,128,1536,0.012109333442317115
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,128,512,0.003165333428316646
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,128,256,0.002833777831660377
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,128,1024,0.010743111371994019
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,128,128,0.0028035555862718155
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,128,512,0.011035555766688453
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,128,256,0.010031110710567897
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,128,128,0.009661333428488838
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,128,32,0.002528888897763358
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,128,64,0.008993777963850234
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,64,65536,0.010007999837398529
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,128,32,0.009366222553782994
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,64,51200,0.009703999592198266
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,128,7168,0.01478488908873664
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,64,16384,0.006959111326270633
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,64,65536,0.048244443204667836
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,64,12288,0.005943111247486538
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,64,51200,0.03970400161213345
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,64,10240,0.0059004442559348206
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,64,16384,0.020227554771635268
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,64,8192,0.006270222365856171
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,64,12288,0.018204443984561496
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,128,2048,0.005492444253630108
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,64,7168,0.005903111149867375
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,64,10240,0.01661333276165856
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,64,6144,0.005948444621430502
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,64,8192,0.01516266663869222
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,64,7168,0.014820444915029736
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,64,4096,0.005215999980767568
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,64,6144,0.014276444911956787
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,64,3584,0.005620444400442972
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,64,5120,0.013390222357379066
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,64,3072,0.00556355549229516
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,64,4096,0.012749333348539142
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,128,768,0.01204533295498954
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,64,2560,0.00591111100382275
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,64,3584,0.013050666285885705
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,64,2048,0.005274666680230035
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,128,64,0.0024888888001441956
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,64,3072,0.012050666742854647
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,64,1536,0.0042071110672420925
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,64,1024,0.0038364442686239877
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,64,2560,0.0127368892232577
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,64,768,0.00351200004418691
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,64,2048,0.011399110986126794
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,64,1536,0.011358222199810876
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,64,1024,0.0107342220014996
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,64,256,0.0026586666289303037
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,64,128,0.0025333333760499954
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,64,768,0.011763555308183035
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,64,512,0.011358222199810876
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,64,64,0.0027955555253558685
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,64,32,0.0026311110705137253
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,64,256,0.009297777381208207
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,64,128,0.009309333231714036
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,32,65536,0.008980444735950893
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,64,32,0.008349333372380998
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,32,51200,0.008290666672918532
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,32,65536,0.04760622315936618
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,32,16384,0.00572533326016532
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,32,51200,0.03956088754865859
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,64,5120,0.005612444546487596
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,32,12288,0.0063457778758472866
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,32,10240,0.006229333165619109
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,32,16384,0.020241777102152508
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,32,8192,0.00527022240890397
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,32,12288,0.018204443984561496
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,32,10240,0.016237333416938782
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,32,8192,0.015465777781274585
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,32,6144,0.00555644432703654
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,32,7168,0.01478844384352366
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,32,5120,0.0052533331844541765
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,64,512,0.0031600000543726813
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,32,6144,0.014440000057220459
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,32,4096,0.005201777650250329
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,32,3584,0.0052639999323421055
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,32,5120,0.013401777380042605
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,32,3072,0.005261333452330695
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,32,4096,0.01274222218328052
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,32,2560,0.005607111172543631
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,32,3584,0.012741333080662621
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,32,2048,0.005225777626037598
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,64,64,0.009333333207501305
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,32,3072,0.012076444096035428
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,32,1536,0.004228444563017951
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,32,1024,0.003495111233658261
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,32,2048,0.011689778003427716
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,32,1536,0.011678222152921887
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,32,768,0.003160888950030009
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,32,512,0.003154666680428717
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,32,1024,0.010741333166758219
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,32,256,0.002806222273243798
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,32,768,0.011045333411958484
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,32,128,0.002519999941190084
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,32,512,0.01074488874938753
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,32,64,0.00249422217408816
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,32,256,0.01038933296998342
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,32,32,0.002549333290921317
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,32,128,0.008616000413894653
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,float16,1,32,7168,0.005623111294375525
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,32,64,0.008635555704434713
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,32,32,0.009314667019579146
VLLM,0.14.1.dev1+gd68209402,NVIDIA B200,gemm,vllm_default,fp8,1,32,2560,0.012108444339699216
